diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000000000000000000000000000000000000..52373fe24473b1aa44333d318f578ae6bf04b49b --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..08a1fb0d8da1afef9b0d4488cac2649eec7d7ed6 --- /dev/null +++ b/README.md @@ -0,0 
+1,173 @@ +--- +tags: +- text-generation +- agent +- tool-use +- long-context +license: other +language: +- en +pipeline_tag: text-generation +--- + +
+ SII + ASI + +
+
+ Chat + + +
+ +# LIMI: Less is More for Agency + +[![arXiv](https://img.shields.io/badge/arXiv-2509.17567-b31b1b.svg)](https://arxiv.org/pdf/2509.17567) +[![GitHub](https://img.shields.io/badge/GitHub-Repository-green)](https://github.com/GAIR-NLP/LIMI) +[![Hugging Face](https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Dataset-blue)](https://huggingface.co/datasets/GAIR/LIMI) + +--- +To learn more about LIMI, feel free to explore our documentation and resources. Our release consists of the following sections: + +- **Model Zoo && Quick Start**: Basic usage and demonstrations with Transformers, vLLM, and SGLang for LIMI and LIMI-Air; +- **Evaluation**: Comprehensive evaluation suite with metrics for agentic capabilities assessment; +- **Prompting**: Usage of LIMI with frameworks for agentic applications, tool use, and reasoning tasks. + +## Overview + +LIMI is an agentic model fine‑tuned from [GLM‑4.5](https://huggingface.co/zai-org/GLM-4.5) using compact, high‑quality data to emphasize: + +- Targeted capabilities: tool use, multi‑turn correction, spec compliance +- Long‑context trajectory with tokenizer‑filtered samples +- OpenAI‑style `messages` with optional function/tool calls + +## Model Details + +- Base model: `zai-org/GLM-4.5` +- Training framework: slime +- Training data: curated conversations from [GAIR/LIMI](https://huggingface.co/datasets/GAIR/LIMI) + +## Performance on AgencyBench + +Our models achieve state-of-the-art performance across multiple agentic evaluation tasks: + +| Model | FTFC (↑) | RC@3 (↑) | SR@3 (↑) | Avg. 
| +|-------|----------|----------|----------|-----------------| +| GLM-4.5-Air | 15.0 | 16.1 | 20.0 | 17.0 | +| GLM-4.5 | 37.8 | 50.0 | 47.4 | 45.1 | +| GLM-4.5-CodeAgent | 48.0 | 48.0 | 47.5 | 47.8 | +| **LIMI-Air** | **35.4** | **34.3** | **33.1** | **34.3** | +| **LIMI** | **71.7** | **74.2** | **74.6** | **73.5** | + +For detailed benchmark results, experimental setup, and comprehensive comparisons, please refer to our [paper](https://arxiv.org/pdf/2509.17567). + +## Model Zoo + +Our LIMI models are available on Hugging Face 🤗: + +| Model | Backbone | Size | Link | +|---|---|---|---| +| LIMI | [GLM‑4.5](https://huggingface.co/zai-org/GLM-4.5) | 353B | https://huggingface.co/GAIR/LIMI | +| LIMI‑Air | [GLM‑4.5‑Air](https://huggingface.co/zai-org/GLM-4.5-Air) | 107B | https://huggingface.co/GAIR/LIMI-Air | + + +## Datasets + +We release our datasets through Hugging Face 🤗: +- Name: `GAIR/LIMI` +- Summary: curated agentic SFT data (OpenAI `messages`, optional `tools`, normalized tool‑call arguments); current release contains ~78 high‑quality samples. +- Link: https://huggingface.co/datasets/GAIR/LIMI + +## Quick Start + +
+Start with HF Transformers + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer +import torch + +model = AutoModelForCausalLM.from_pretrained( + "GAIR/LIMI", torch_dtype="auto", device_map="auto", trust_remote_code=True +) +tok = AutoTokenizer.from_pretrained("GAIR/LIMI", trust_remote_code=True) + +messages = [ + {"role": "system", "content": "You are a helpful assistant tasked with discovering mathematical function structures for scientific systems."}, + {"role": "user", "content": "Modify the equation.py function, considering the physical meaning and relationships of the inputs."} +] + +text = tok.apply_chat_template(messages, tokenize=False, add_generation_prompt=True) +inputs = tok(text, return_tensors="pt").to(model.device) +out = model.generate( + **inputs, + max_new_tokens=4096, + temperature=0.6, + top_p=0.95, + do_sample=True, +) +print(tok.decode(out[0][inputs['input_ids'].shape[1]:], skip_special_tokens=True)) +``` + +
+ +
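+Start with vLLM + +```python +from vllm import LLM, SamplingParams +from transformers import AutoTokenizer + +llm = LLM(model="GAIR/LIMI", trust_remote_code=True) +tok = AutoTokenizer.from_pretrained("GAIR/LIMI", trust_remote_code=True) + +messages = [ + {"role": "system", "content": "You are a helpful assistant tasked with discovering mathematical function structures for scientific systems."}, + {"role": "user", "content": "Modify the equation.py function, considering the physical meaning and relationships of the inputs."} +] + +text = tok.apply_chat_template(messages, tokenize=False, add_generation_prompt=True) +out = llm.generate(text, SamplingParams(temperature=0.6, max_tokens=4096, top_p=0.95)) +print(out[0].outputs[0].text) +``` + +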
+ +## Prompting + +- Messages follow OpenAI chat format; include a grounding system message when helpful. +- Example: + +```json +[ + {"role": "system", "content": "You are a helpful assistant tasked with discovering mathematical function structures for scientific systems."}, + {"role": "user", "content": "Modify the equation.py function, considering the physical meaning and relationships of the inputs."} +] +``` + +## Evaluation + +- We report FTFC (First‑Turn Functional Completeness), SR@R (Success Rate at R), and RC@R (Remaining Chances at R) with R=3. +- See the paper for experimental protocol and scores. + +## Limitations + +- May produce incorrect tool arguments or overfit to frequent schemas +- Not safety‑filtered for sensitive domains; use with guardrails and oversight + +## License + +- Inherits base model (GLM‑4.5) terms; verify upstream license before deployment + +## Citation + +```bibtex +@misc{xiao2025limiagency, + title={LIMI: Less is More for Agency}, + author={Yang Xiao and Mohan Jiang and Jie Sun and Keyu Li and Jifan Lin and Yumin Zhuang and Ji Zeng and Shijie Xia and Qishuo Hua and Xuefeng Li and Xiaojie Cai and Tongyu Wang and Yue Zhang and Liming Liu and Xia Wu and Jinlong Hou and Yuan Cheng and Wenjie Li and Xiang Wang and Dequan Wang and Pengfei Liu}, + year={2025}, + eprint={2509.17567}, + archivePrefix={arXiv}, + primaryClass={cs.AI}, + url={https://arxiv.org/abs/2509.17567}, +} +``` + diff --git a/assets/asi.png b/assets/asi.png new file mode 100644 index 0000000000000000000000000000000000000000..e3105400a6aac31fb13bc6a291beea935682f5f8 Binary files /dev/null and b/assets/asi.png differ diff --git a/assets/sii.jpg b/assets/sii.jpg new file mode 100644 index 0000000000000000000000000000000000000000..db144274da59427c8be0ca8c1fe380f972206666 Binary files /dev/null and b/assets/sii.jpg differ diff --git a/assets/teaser.jpg b/assets/teaser.jpg new file mode 100644 index 
0000000000000000000000000000000000000000..7f5e08808d023905f41f7ec6a7c0e3ae9355921c --- /dev/null +++ b/assets/teaser.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08c1ca91506c69729c2a4f66f50391e46fd6cb0998d98b035786d4273ac5a30 +size 232779 diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,103 @@ +[gMASK] +{%- if tools -%} +<|system|> +# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: + +{% for tool in tools %} +{{ tool | tojson(ensure_ascii=False) }} +{% endfor %} + + +For each function call, output the function name and arguments within the following XML format: +{function-name} +{arg-key-1} +{arg-value-1} +{arg-key-2} +{arg-value-2} +... +{%- endif -%} +{%- macro visible_text(content) -%} + {%- if content is string -%} + {{- content }} + {%- elif content is iterable and content is not mapping -%} + {%- for item in content -%} + {%- if item is mapping and item.type == 'text' -%} + {{- item.text }} + {%- elif item is string -%} + {{- item }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{- content }} + {%- endif -%} +{%- endmacro -%} +{%- set ns = namespace(last_user_index=-1) %} +{%- for m in messages %} + {%- if m.role == 'user' %} + {% set ns.last_user_index = loop.index0 -%} + {%- endif %} +{%- endfor %} +{% for m in messages %} +{%- if m.role == 'user' -%}<|user|> +{{ visible_text(m.content) }} +{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}} +{%- elif m.role == 'assistant' -%} +<|assistant|> +{%- set reasoning_content = '' %} +{%- set content = visible_text(m.content) %} +{%- if m.reasoning_content is string %} + {%- set reasoning_content = m.reasoning_content %} +{%- else %} + {%- if '' 
in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} +{%- endif %} +{%- if loop.index0 > ns.last_user_index and reasoning_content -%} +{{ '\n' + reasoning_content.strip() + ''}} +{%- else -%} +{{ '\n' }} +{%- endif -%} +{%- if content.strip() -%} +{{ '\n' + content.strip() }} +{%- endif -%} +{% if m.tool_calls %} +{% for tc in m.tool_calls %} +{%- if tc.function %} + {%- set tc = tc.function %} +{%- endif %} +{{ '\n' + tc.name }} +{% set _args = tc.arguments %} +{% for k, v in _args.items() %} +{{ k }} +{{ v | tojson(ensure_ascii=False) if v is not string else v }} +{% endfor %} +{% endfor %} +{% endif %} +{%- elif m.role == 'tool' -%} +{%- if m.content is string -%} +{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|observation|>' }} +{%- endif %} +{{- '\n\n' }} +{{- m.content }} +{{- '\n' }} +{%- else -%} +<|observation|>{% for tr in m.content %} + + +{{ tr.output if tr.output is defined else tr }} +{% endfor -%} +{% endif -%} +{%- elif m.role == 'system' -%} +<|system|> +{{ visible_text(m.content) }} +{%- endif -%} +{%- endfor -%} +{%- if add_generation_prompt -%} + <|assistant|>{{- '\n' if (enable_thinking is defined and not enable_thinking) else '' -}} +{%- endif -%} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8a792d99a36139dda07b552468252dc36873f32 --- /dev/null +++ b/config.json @@ -0,0 +1,43 @@ +{ + "architectures": [ + "Glm4MoeForCausalLM" + ], + "attention_bias": true, + "attention_dropout": 0.0, + "pad_token_id": 151329, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "partial_rotary_factor": 0.5, + "initializer_range": 0.02, + "intermediate_size": 12288, + "max_position_embeddings": 131072, + "model_type": "glm4_moe", + 
"moe_intermediate_size": 1536, + "norm_topk_prob": true, + "num_attention_heads": 96, + "n_group": 1, + "topk_group": 1, + "n_routed_experts": 160, + "n_shared_experts": 1, + "routed_scaling_factor": 2.5, + "num_experts_per_tok": 8, + "first_k_dense_replace": 3, + "num_hidden_layers": 92, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 1000000, + "num_nextn_predict_layers": 1, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.54.0", + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 151552 +} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d49113f3e19072368c98e53180331c77c07c8a6 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,10 @@ +{ + "_from_model_config": true, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "pad_token_id": 151329, + "transformers_version": "4.54.0" +} diff --git a/model-00000-of-00132.safetensors b/model-00000-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..87b178071457b39ac93f2c5d1886a314c4a40c1f --- /dev/null +++ b/model-00000-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88229a6b90a56738069cea431ed1967a6f93c5d56f30dae467c9f210ad57c9f +size 5358375840 diff --git a/model-00001-of-00132.safetensors b/model-00001-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2da4dadf12c049cfd72f6c06d27e37f745a4f6f8 --- /dev/null +++ b/model-00001-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc48a72ccf9e99dd1316a4129a52619c690ec83bc00e403c26bb4fc0da63f2b +size 5354671176 diff --git a/model-00002-of-00132.safetensors b/model-00002-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3eba21e0105acbc82b501f29f8633282a531e26d --- 
/dev/null +++ b/model-00002-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f16d09866b2554b46bb963b7bed68b4a172380dfe5df8c23bc7bb90ca052ea +size 5363508520 diff --git a/model-00003-of-00132.safetensors b/model-00003-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6654b0695d4f44017a42f017a3e3493a78e9aad1 --- /dev/null +++ b/model-00003-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd855e20ea4049a294a68b7d28268519d6b96868a76e98c2c530410043efe36 +size 5363548312 diff --git a/model-00004-of-00132.safetensors b/model-00004-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6744ccdbe72c552fc941fd33bfe13682db575bca --- /dev/null +++ b/model-00004-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1118e4f4bbb52e46bc6b3f6ec9d36cf7373b504a7e0341486ec4ecc37ca6a06e +size 5354671160 diff --git a/model-00005-of-00132.safetensors b/model-00005-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..17e949dbcfe42c48d26b9da7326d888f5ac885b1 --- /dev/null +++ b/model-00005-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2390f34fd1d401dcc014fe271c42aa36daea3177e71c85e0f57b90e921a9f0a +size 5363508568 diff --git a/model-00006-of-00132.safetensors b/model-00006-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db61baa0a6dcd8f26131a6e6a44f9a5464b16103 --- /dev/null +++ b/model-00006-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2518fd9690d2d2a99d32b3208ba28295f552318cd549b0b72c0b6358e0762d52 +size 5363548312 diff --git a/model-00007-of-00132.safetensors b/model-00007-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e2d975cc143219d550e58d38712302f01337421 --- /dev/null 
+++ b/model-00007-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f164a0adb406e02afa492be5bada2b465997cb272f2de379bb8851d34aca1e4f +size 5354671120 diff --git a/model-00008-of-00132.safetensors b/model-00008-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a9c0b9fbcd8140fa336f954d85e361ef2a21ea4 --- /dev/null +++ b/model-00008-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd6b55fb86a2b1f08a3599b2d44ca8c6bb99225a5a185bec42a43d95c094bbf +size 5363508624 diff --git a/model-00009-of-00132.safetensors b/model-00009-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..283238bf5895981ee9cecb1aaa5eb8211ff7a55f --- /dev/null +++ b/model-00009-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79638de3bb541caa92a60aa19224752fd4cd208b4350f463df478734ea673714 +size 5363548296 diff --git a/model-00010-of-00132.safetensors b/model-00010-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fdbc4f5196312795f771e12e2360e9fe277fd4f8 --- /dev/null +++ b/model-00010-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a25a35c9b79f08338e3c7f9f3f8ab3a0f8c26f5b02f2548c2cf7b1b03338fce +size 5365186128 diff --git a/model-00011-of-00132.safetensors b/model-00011-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52e18095a6e201d4cdc6ddebb84bb2c1ed56459b --- /dev/null +++ b/model-00011-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f20b87ac7d3b68d406fa73b75f98f59cd4e2b94f22e03eac95ecf6d284d05c +size 5363509064 diff --git a/model-00012-of-00132.safetensors b/model-00012-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..73dd98f9ece681ced614f4abc58185f0f85eed72 --- /dev/null +++ 
b/model-00012-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc0eb0e4748e00b6b96f515ff319e1e2b640546e086c92043057aa568458b30 +size 5363519576 diff --git a/model-00013-of-00132.safetensors b/model-00013-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a92520d53126947b3aff2e6f948e2c1e2c960c2 --- /dev/null +++ b/model-00013-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf3d0807df52fb59ed0a87805d23c77c57016808c38786e8ccca57bffecc447 +size 5365186280 diff --git a/model-00014-of-00132.safetensors b/model-00014-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8f4ca58f2314efa1a935562efe584e567e6e5ff2 --- /dev/null +++ b/model-00014-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9e773d0169e6c2ddf3a590ea7bf6e352fb22e09912136940ce09fe1367e7f3 +size 5363519784 diff --git a/model-00015-of-00132.safetensors b/model-00015-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f57b1845e1606dd673c806c1ae5dc2b4b76f2519 --- /dev/null +++ b/model-00015-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d6b61893cfe23c891a148ef2b466c819c3cf1b21660776a4a67f5832b8413f +size 5363508912 diff --git a/model-00016-of-00132.safetensors b/model-00016-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a909276d237252e3bc8edd5d7fa772cf920759c3 --- /dev/null +++ b/model-00016-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e14fb11ccc0ad341a351eb0684c3aba0f94dfca60e1a7b3ca897e488f0fd91 +size 5365186272 diff --git a/model-00017-of-00132.safetensors b/model-00017-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08a9746f8bf9f230645b43d480db691cbc7f6c3d --- /dev/null +++ 
b/model-00017-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d55d74aa8d1e8f096546f6184be2d4b75eaf00e5af9bb399b34b0d021cc0d3 +size 5363519744 diff --git a/model-00018-of-00132.safetensors b/model-00018-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa1bfad8c13f38decd9791ed01664f7629dcc055 --- /dev/null +++ b/model-00018-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55013d2053638038f47d69546ae4c4de241860683b693bf839afcb097f222f31 +size 5363508976 diff --git a/model-00019-of-00132.safetensors b/model-00019-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58fd85efe854fa537138b188df0343420a39e955 --- /dev/null +++ b/model-00019-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d820c68d8bca5015c7711b048536a9e1c848e0dcab983ce43377e5fac34b8741 +size 5365187000 diff --git a/model-00020-of-00132.safetensors b/model-00020-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04d2c2766c0f7bdf1f078789a0385738e7fe9295 --- /dev/null +++ b/model-00020-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4706756c1fdf3fb1bced74c77ba0f6c71ae9205e266aa67aea989b4a6a805b22 +size 5363519688 diff --git a/model-00021-of-00132.safetensors b/model-00021-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07cdc847d06674e38b926dab5fc55f502d466d51 --- /dev/null +++ b/model-00021-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee704c04c024da2f3e4a07d8deeea91cac25ad1ae3429f4e1db202416b4725e +size 5365187176 diff --git a/model-00022-of-00132.safetensors b/model-00022-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f168330f459b3e4ff50c74132d096fe34418dd1e --- /dev/null +++ 
b/model-00022-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28bb37bc3f850326d8f470d1033f6e9a9b0bbaf824a0c588220722be11571fe5 +size 5363508840 diff --git a/model-00023-of-00132.safetensors b/model-00023-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58073592c7f9939d9e584c3d5203d20630f8d262 --- /dev/null +++ b/model-00023-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd8c2ffe5c8f320e835f77c8ae69ea8760d7f89db0103f5a975fc9ad145fcdf +size 5353033000 diff --git a/model-00024-of-00132.safetensors b/model-00024-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8f95ab8407a5547f1670abd9d5a30f8600e6d99 --- /dev/null +++ b/model-00024-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:959acbc893ff8fe117d27b668448f12c05a07e29b2969961e50bd60e19f410e2 +size 5354671496 diff --git a/model-00025-of-00132.safetensors b/model-00025-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ca5f08bddaa36b40cac9dd4d4be418ed9b86be1 --- /dev/null +++ b/model-00025-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7389c496f0fd93cd0f4d21c5d7d296f23e899ff066bf34a5a700d76b1c9f0652 +size 5363508888 diff --git a/model-00026-of-00132.safetensors b/model-00026-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01c1848d4ad1dbc106f9d2d593f9c9f5a738fce4 --- /dev/null +++ b/model-00026-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ce81a674b5f754cc872d647115a8264c98e940cc2e75f0dc5f5882e342a0f5 +size 5363548656 diff --git a/model-00027-of-00132.safetensors b/model-00027-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb5cc50d1a0c29c113b876fd6139994981c58331 --- /dev/null +++ 
b/model-00027-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228c4d3bab5fe24aebcaf841b3ab1d556e09783a5f8a37e08e1765e9e9215177 +size 5354671464 diff --git a/model-00028-of-00132.safetensors b/model-00028-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6604a9a4112683e0733ed242b04bc8bab23fb04 --- /dev/null +++ b/model-00028-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6f90af4b070f6e026e80cba2c959031d65fc6c93b1e86f2fc6b1665ce211f7 +size 5363508928 diff --git a/model-00029-of-00132.safetensors b/model-00029-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a26a73ad1a9d93809ea60e8d3c27515140ffcf2 --- /dev/null +++ b/model-00029-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0f96a957d134c733976d118c5b300ec72c5b4d79d2e74f2aa11e1512ecbf5f +size 5273906752 diff --git a/model-00030-of-00132.safetensors b/model-00030-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad73d86e50551e4b6b584a98551cefa52c190001 --- /dev/null +++ b/model-00030-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caeba0f0ffe3b35e79f679243e70081f15a503224428e8f4d6a6babddd0e83f8 +size 5359994840 diff --git a/model-00031-of-00132.safetensors b/model-00031-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cfad944224e35d2e2bce069c7f8bd17e32faeb34 --- /dev/null +++ b/model-00031-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71c016cc8e6a64032aaa3f7aca3595f1f46bab22f99284ee3aa125140ef3f02 +size 5365198640 diff --git a/model-00032-of-00132.safetensors b/model-00032-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..878ef926ceb6920c2b8a3c7f0048012d89167115 --- /dev/null +++ 
b/model-00032-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c8b84b2ec7f2c8dfb3049e2c9fd2ac4c9030565279594b8cb9cf837ef9205c0 +size 5353072712 diff --git a/model-00033-of-00132.safetensors b/model-00033-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..33c6a4c86cdcd1739579ce3bc833b9f1dc54385a --- /dev/null +++ b/model-00033-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d88d66d8110d4a5cce568ceef88f8fe006d961bcb35d919c215872116399ba +size 5363508880 diff --git a/model-00034-of-00132.safetensors b/model-00034-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a53946381f173796d530cef3ccf67a80fcce3e15 --- /dev/null +++ b/model-00034-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f88eb05cd013b87160be8cbfb67317ab0ecf43f49373cc8af4c1d18e70896d +size 5365198632 diff --git a/model-00035-of-00132.safetensors b/model-00035-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..490d31cbc4288d33b066f8ef35cbeb9731c33885 --- /dev/null +++ b/model-00035-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f556cc2d441790060d215148a319118ac86599e33fa31be2c12d048ce295cb +size 5353072688 diff --git a/model-00036-of-00132.safetensors b/model-00036-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cbbd03bcd0afbf6e987188d8dbf8a8ed332f766b --- /dev/null +++ b/model-00036-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d52f0d67ad3b568911e2f167eb00be8c434025db14e4ba88bfdc2640cdaf27 +size 5363508920 diff --git a/model-00037-of-00132.safetensors b/model-00037-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..244f61419c0b39b296c8ebc82183b2110cf359b2 --- /dev/null +++ 
b/model-00037-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d378a924ab931b79ba3266feac386057d5ad22d8c98479022bec57f882186b0 +size 5365198632 diff --git a/model-00038-of-00132.safetensors b/model-00038-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc03f34029a745f1fea294fc20b4a84db5825ce5 --- /dev/null +++ b/model-00038-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e33d9e8378a5f834ca3f505cd24f1da1f6aab2b7c1f09b110d204601966bee +size 5353072648 diff --git a/model-00039-of-00132.safetensors b/model-00039-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..819db9ef7894e01dd5c00b305c9529c86ad5e118 --- /dev/null +++ b/model-00039-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5f657413508a3a6fb5d6624c90a38130eec242473c8dfa4440f8efe6ea8371 +size 5363508984 diff --git a/model-00040-of-00132.safetensors b/model-00040-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6be6788175ee41332bd9e6152f2df880b1fc3c07 --- /dev/null +++ b/model-00040-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3848e1fca798383ee1ad3fbec48a6521e9f7b2a91c75a7d08f825419fdad737 +size 5365198608 diff --git a/model-00041-of-00132.safetensors b/model-00041-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f16ec3e1a33f47cf6fc01e47f7432a7d30accdc --- /dev/null +++ b/model-00041-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1c51a660295ac03c54011ca8efed3aa017fab144ffb8040a03722cdff0c420 +size 5353072608 diff --git a/model-00042-of-00132.safetensors b/model-00042-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42570d8297b15a637e22c1cc6a93fb83e47c1e11 --- /dev/null +++ 
b/model-00042-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c44dc7a4794d37d347457547baed2d333b8f35cbe82814d28f31e5beb5979f +size 5365198784 diff --git a/model-00043-of-00132.safetensors b/model-00043-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..13c1bcf9190305c2a8dcfaea18e75156e8aacdd4 --- /dev/null +++ b/model-00043-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a507ea42ac3eba6490d118a427899f022481837b173b8493d3e49562995c403b +size 5363508840 diff --git a/model-00044-of-00132.safetensors b/model-00044-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..559b5013cf71814bcf748ed4a706d8932a54ff40 --- /dev/null +++ b/model-00044-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6704057e46edef17fe9c4d01a672ad7cdc321f327a7581748548537e90b1df69 +size 5353072584 diff --git a/model-00045-of-00132.safetensors b/model-00045-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d59b806e85005a4904b60c0be629d1769b44d5c9 --- /dev/null +++ b/model-00045-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b517edbec096c9d50272e1e7ccbf389aeb8085cf85a6b155f01e9e8e01e09a2 +size 5365198760 diff --git a/model-00046-of-00132.safetensors b/model-00046-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30f98a19b55e6ee69ecfa82c80f9121d52b4b406 --- /dev/null +++ b/model-00046-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a622701d7a758131c8038b30320688d8e466f79f912350e1d11f2408d0356e4 +size 5363508904 diff --git a/model-00047-of-00132.safetensors b/model-00047-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92f03c25010426a19697b1c1af0bef7c26fda1d4 --- /dev/null +++ 
b/model-00047-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e89ee5a562c838527d5e8ce84f50120f190d7ac3844253499949f25609a6c4 +size 5353072568 diff --git a/model-00048-of-00132.safetensors b/model-00048-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..760ca764bc7de3efe5c93d7c2077686693af486b --- /dev/null +++ b/model-00048-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171b48284b941a7ea4de084fd3c7cb4ef84091fa3ac4e4c22e4d792e2f398b16 +size 5365198744 diff --git a/model-00049-of-00132.safetensors b/model-00049-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cac69d4e2d5b263049d5bb7f53910cab361dc2c6 --- /dev/null +++ b/model-00049-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62ecf0d909f96268dbec49ab37f75a6f42bd1bb425297df47c1440b9e5d9da4 +size 5363508944 diff --git a/model-00050-of-00132.safetensors b/model-00050-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..965f60c5278f0df9c00d0c7814b60a2a5fbd8602 --- /dev/null +++ b/model-00050-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b321431df36827f65d869ea439350766dbe4141a4bded7075e943a119b402c5d +size 5353072560 diff --git a/model-00051-of-00132.safetensors b/model-00051-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5bf6578e28f91987431fc6269cffc9852b508967 --- /dev/null +++ b/model-00051-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e584a156d9898906a91f8be869d21ee6447aab991827779367a5b613a234058 +size 5365198704 diff --git a/model-00052-of-00132.safetensors b/model-00052-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00879efb062b037b223222ec645e118ff3a03923 --- /dev/null +++ 
b/model-00052-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e5a5d0dbf4d05ec6dbf3510d52200d26d1e9c136876915625ba03ee2de46b71 +size 5363509024 diff --git a/model-00053-of-00132.safetensors b/model-00053-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c42b45b8fef507060535ec1efe12169ce5438a71 --- /dev/null +++ b/model-00053-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cd09b6967bed2ea24ea639d2a8eb4c2dc88172b963f344898ed84ab89f6afc +size 5353072520 diff --git a/model-00054-of-00132.safetensors b/model-00054-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..827be75c5b940f311979638794396b6a8e858851 --- /dev/null +++ b/model-00054-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a030d66cc999453e993a7bf04547e71cedee1e8bad45796fce1dd13ab420de +size 5365198664 diff --git a/model-00055-of-00132.safetensors b/model-00055-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..581c72762377d5f934cc4e93e725b67d7989de54 --- /dev/null +++ b/model-00055-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51595a112fd1a621d0d3129fd4f613629f392645687ba2dae4b93d10b3658e5b +size 5353072736 diff --git a/model-00056-of-00132.safetensors b/model-00056-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61a5e4addd54b49214adc757e1c8932686594db1 --- /dev/null +++ b/model-00056-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f31364a780be69e6ec885497768a280c29d12e07ddfe5b6ec22a583b447c76 +size 5363508840 diff --git a/model-00057-of-00132.safetensors b/model-00057-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ebae9a1f0f9b3280ca273ebbc8833ecdde98ab21 --- /dev/null +++ 
b/model-00057-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:283c4b28134aacd128a22a12fb9838bf6f6cc5c1e503f7b344ec8dc8ed6515a4 +size 5365198632 diff --git a/model-00058-of-00132.safetensors b/model-00058-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c15fa41f1ae62dc4c90c171b34802efe8edda27 --- /dev/null +++ b/model-00058-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9c936f7072529e10963c1383d828f2f2f97e4b52c38a4d36d5954125d45408 +size 5353072712 diff --git a/model-00059-of-00132.safetensors b/model-00059-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91eac44fa7ce249fcf57d7bae83120bf6e753111 --- /dev/null +++ b/model-00059-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9af47022ff2bf28a66c41e0bfd75bd81cec8062c7af96d62bc399118ac89f0 +size 5363508904 diff --git a/model-00060-of-00132.safetensors b/model-00060-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..808516ee36f5c5b660da58453e0d1e5d5f567e12 --- /dev/null +++ b/model-00060-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc33b97d4a5edb138c6c2653ec9e103daf1f13f0927a6e5899bc49ffd383ceb +size 5365198632 diff --git a/model-00061-of-00132.safetensors b/model-00061-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1685cef3d3fa7b6a117ba4784443a0471f3c7785 --- /dev/null +++ b/model-00061-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2407ef0e22c7ed127420272d8e2fe9dfe467da06350841781d08c2de7dd95f09 +size 5353072672 diff --git a/model-00062-of-00132.safetensors b/model-00062-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4857271d3f5206be57d188a56200c8ba12a76e48 --- /dev/null +++ 
b/model-00062-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6921886d8f5b8a9346484dd71c6a8a76ee2e0d32ca4690b621cbab0c181bb71c +size 5363508944 diff --git a/model-00063-of-00132.safetensors b/model-00063-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd13122095566d46ed063c20506c6e745a2aba61 --- /dev/null +++ b/model-00063-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049f75ea0a1387d325aa402791862df95de364d78e4efaffee34aed56b38c255 +size 5367473224 diff --git a/model-00064-of-00132.safetensors b/model-00064-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9027c9cb5f089a1595663dd67cf614c837dc7499 --- /dev/null +++ b/model-00064-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a109d8709c18a0fc98297a89b5e4fb963415e3c74e4d933b4b30ea486a60f17e +size 5363508920 diff --git a/model-00065-of-00132.safetensors b/model-00065-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..714683f3fd2a887847b3b548b116e3b6d1c0aee3 --- /dev/null +++ b/model-00065-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35c591f1e9c771e20aee15d3bf38de92dfa5ec5f455b27be67230e7812eb8c8 +size 5365198624 diff --git a/model-00066-of-00132.safetensors b/model-00066-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f47a3c15d3c9d006add5465752b7b3120d938bd --- /dev/null +++ b/model-00066-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354c80ff99242745c66c686d465568ed9a3d74902eab70e7bd8e3afc922982ca +size 5353072656 diff --git a/model-00067-of-00132.safetensors b/model-00067-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dca4832843e1d76e4f1363abf877634eddac4327 --- /dev/null +++ 
b/model-00067-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea1434249b2544c21d4d449f19e08d5a644b589561a86965f86a8fde5302c7a +size 5363508984 diff --git a/model-00068-of-00132.safetensors b/model-00068-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..373a398480b66a0bb2271a0d0dc6f3e12ed165d9 --- /dev/null +++ b/model-00068-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4d78e658de7ccf2e393f90c112f84d3e09a6516f4dcae44626554037a25c12 +size 5365198608 diff --git a/model-00069-of-00132.safetensors b/model-00069-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..416d467987f31668d74286940132190640eace59 --- /dev/null +++ b/model-00069-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4226cb7b205a984cab101def9e5c40c0767e07fb23d04d1abdb44e677528d8f4 +size 5353072616 diff --git a/model-00070-of-00132.safetensors b/model-00070-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..630e03ef707c2463a0422cf6112df6b0028e3e9d --- /dev/null +++ b/model-00070-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d632cfb99c95a402be4935758ae145960e7200b0acff40d42e51a1a8bc900dc2 +size 5363509064 diff --git a/model-00071-of-00132.safetensors b/model-00071-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c4671691264c0c0c5eca0b446e8573bf8b5c6e0 --- /dev/null +++ b/model-00071-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb01c41931c505830c624e4c7c102fc5027c93b72ca6c56bfc09dacdcc79eedd +size 5365198552 diff --git a/model-00072-of-00132.safetensors b/model-00072-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7aa600623f2918327d22a2e4dbba376cb23fafb7 --- /dev/null +++ 
b/model-00072-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7003da69597c0f816a503e25eb42c32e71bebcc34109218bc1f1ac7bce4f14e8 +size 5353072584 diff --git a/model-00073-of-00132.safetensors b/model-00073-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ecb5395f16c8fc9cfaa278ac012616a59dff4a0d --- /dev/null +++ b/model-00073-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3e5365a3a07f38ec2ec81da4db46fb0118b3101196c6a68187357a455b02f5 +size 5365198760 diff --git a/model-00074-of-00132.safetensors b/model-00074-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d879c03b1b8ff2eebae83f2576bb1dc37530b381 --- /dev/null +++ b/model-00074-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fae12a3264525e8181044eafd6e91c4aad884efb36f68309bd2a9ab88b02c9f +size 5363508896 diff --git a/model-00075-of-00132.safetensors b/model-00075-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cbe30a2bc85928902a94fd62bb020e9bf191fa1 --- /dev/null +++ b/model-00075-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3a4928ac07234b82af99165484cc390146cef56d6474ce0f6e5128433656a1 +size 5353072568 diff --git a/model-00076-of-00132.safetensors b/model-00076-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f1524c9ef12a5bb77d120f2ab9a76717ff7198fe --- /dev/null +++ b/model-00076-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19bdcbaf58680e7ed0eb2a5aed4e134d68201e1773dc2c5a33c8d74104a1bda +size 5365198744 diff --git a/model-00077-of-00132.safetensors b/model-00077-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cac825f16cd7dff76cbab2aa063e991d0fb7436e --- /dev/null +++ 
b/model-00077-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac39de203aba28bff75b8e49510981000ca967d11431286623fa0623554d20e +size 5363508936 diff --git a/model-00078-of-00132.safetensors b/model-00078-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ee0710bd4f7a44ccb758fc8e45d297855009d2f --- /dev/null +++ b/model-00078-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e69877e62e1513fd69b11d1ad5f3d9b42a2cf690a21d70225637c710e4287c2 +size 5353072560 diff --git a/model-00079-of-00132.safetensors b/model-00079-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..561e8af56066e69cc15f798e1c5ce613151965e0 --- /dev/null +++ b/model-00079-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35a4a4f2dfe021bb8218ec32b9794bc474974ccca73818792f7e84ab747bbcc +size 5365198704 diff --git a/model-00080-of-00132.safetensors b/model-00080-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c144c7403531f31b4f636d33093703bdbe73bd64 --- /dev/null +++ b/model-00080-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a386b379e875297c451370fa5802ad069a098e1ac1417fd934c11d20a2f0f8 +size 5363509016 diff --git a/model-00081-of-00132.safetensors b/model-00081-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76eb233170818d0d9d739d592b4f593d2c7a5bfe --- /dev/null +++ b/model-00081-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24541348449097b6923940dec92ab5ee7457e0463deb98d891a255d3d21e9467 +size 5353072520 diff --git a/model-00082-of-00132.safetensors b/model-00082-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8440011abde75cb02df51f7f54012335fe5a6e96 --- /dev/null +++ 
b/model-00082-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2de3ae09ef0acbe2ed061ec9836a6db0a6598b19b358f0b42004192107ad9a +size 5365198664 diff --git a/model-00083-of-00132.safetensors b/model-00083-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d56259a7d3fcf16437e77f224bcc6d37addb1a10 --- /dev/null +++ b/model-00083-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd30d1d1d0e8b0d388224b5de3e124c89385fefa292e832767422d60aedd094 +size 5358274768 diff --git a/model-00084-of-00132.safetensors b/model-00084-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d7b0f2839b55d7e08f2b2c53f51f592e5fb6e56 --- /dev/null +++ b/model-00084-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dafc08f24acf2025a0e798df536af2f383db725d752fc3f680674032a87e0a70 +size 5358306800 diff --git a/model-00085-of-00132.safetensors b/model-00085-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..667ba29258a5a83a4b57785eae2b2ad0f919dbaf --- /dev/null +++ b/model-00085-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e8667617f1056f3e47536a340bcf119d85165549e3aeec2293cdc7861ab79d +size 5365198632 diff --git a/model-00086-of-00132.safetensors b/model-00086-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2da12cf37eb43c298cd46d1039764b3dc617dea --- /dev/null +++ b/model-00086-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7225c522fb0e5ec2602eb0dcf3c86b3b1546964ccb7c4221e9e06d351128bff +size 5353072712 diff --git a/model-00087-of-00132.safetensors b/model-00087-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7dad68d00d865aefb2292238e527a51d5e148d04 --- /dev/null +++ 
b/model-00087-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d33efda9360c3e657b41f14f2e01477d9a8c8190da6ce8b0cf3fd7d6f89aea +size 5363508896 diff --git a/model-00088-of-00132.safetensors b/model-00088-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..764e485274b3460677adabd7b2c47cf12af99316 --- /dev/null +++ b/model-00088-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51b6ec7350df600a82df1617a200a8cae2dd705836605a5d2df325c35ecbfd6 +size 5365198632 diff --git a/model-00089-of-00132.safetensors b/model-00089-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..73fa596359091bb1946c444219188db132a3b72d --- /dev/null +++ b/model-00089-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3bb2dad0b578e2fac588d1cbcb4a97019ffa47a0d91444147ccd9824d05e34c +size 5353072680 diff --git a/model-00090-of-00132.safetensors b/model-00090-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8bd16e34fc7bfaca4f7444e6da1eb61c1f06f1d --- /dev/null +++ b/model-00090-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b7df26b1fe08e7123bd11ce6f73ff8d17115aff95cbe8bc2cf89665420131b +size 5363508936 diff --git a/model-00091-of-00132.safetensors b/model-00091-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4cfea0b12d52e2ff598823801d0de9339744d744 --- /dev/null +++ b/model-00091-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d195b2ee6e465a397c8f32faa65b79096509295762249a36dd167bec318d0f +size 5365198632 diff --git a/model-00092-of-00132.safetensors b/model-00092-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..267e71b4d25f560f871695ffb10be0c163edb06b --- /dev/null +++ 
b/model-00092-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ffceb5e5d3d63c43ee38de5e60fb67fb0f97a19f08c2ac3464e61a2faa41ad +size 5353072640 diff --git a/model-00093-of-00132.safetensors b/model-00093-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8be10746900cabe34e591a0266bddca87f678317 --- /dev/null +++ b/model-00093-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa6ed1fd806e49553935f54049fc2f8234ff4f9f14a5cb6f6aec381d7a816bd +size 5363509016 diff --git a/model-00094-of-00132.safetensors b/model-00094-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5372b2c281f398d4e76198153af618c1a3e4c8a8 --- /dev/null +++ b/model-00094-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de26ac06ac272bb773ac44e364abaf5bf23b53d99068d396208bec6f26aaf58 +size 5365198592 diff --git a/model-00095-of-00132.safetensors b/model-00095-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..516e526c432a93767287644aba4546260e6b063d --- /dev/null +++ b/model-00095-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3176cd0385b86fe6d55b98fba5b79225af20fbf104e591988d296288d68f3b86 +size 5353072600 diff --git a/model-00096-of-00132.safetensors b/model-00096-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa58d558a3df1c5314a44afe71b10aa0deac6c0e --- /dev/null +++ b/model-00096-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb9ddb70ad04015488d66cc5c1a53f664a37de437ec7804265d3348313123867 +size 5255045368 diff --git a/model-00097-of-00132.safetensors b/model-00097-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c4caa9419989b64683a08575270424c11d2a329 --- /dev/null +++ 
b/model-00097-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:647cf1925d26cc1ff1a5985f71612c7283e807ffa450762472f460bd3e0a9346 +size 5360542384 diff --git a/model-00098-of-00132.safetensors b/model-00098-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b2d4fb2074d694afabff35ea35bd15739f4a281 --- /dev/null +++ b/model-00098-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeed2494c1685af548eea1cfc2d859a9edb2ef9387f09414709b820d909a32ca +size 5363509040 diff --git a/model-00099-of-00132.safetensors b/model-00099-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cff0676b8d5b41473ac9dca419dfa9be5afcd168 --- /dev/null +++ b/model-00099-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a9dd8e513431a3bef2bcf698de6d6a47ff99e845a890a7222d040cd82e154e +size 5363509216 diff --git a/model-00100-of-00132.safetensors b/model-00100-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91f8486d3ebb7ad9afa6a998d66c8e6f5598451e --- /dev/null +++ b/model-00100-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc10f904875282d3a16cd8784d8c7bcb8763bfdebf524782cc63227de592530 +size 5365147672 diff --git a/model-00101-of-00132.safetensors b/model-00101-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82a3b2bab9ad54e1aba64b71f638dbf767ae2b3a --- /dev/null +++ b/model-00101-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ebf280f59e0ade4488111c01ee2080ce8b50981fd9e41e41188f7c9b638de7 +size 5363538424 diff --git a/model-00102-of-00132.safetensors b/model-00102-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc085e1a5db1242956b2a079db137495227b1c6a --- /dev/null +++ 
b/model-00102-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8473901a42cb718ffae05bbf645c8d19b9da0fb8c307c7854064e778d114b398 +size 5363508904 diff --git a/model-00103-of-00132.safetensors b/model-00103-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f3e8e87cef20e029dd3f18135f4470a969300d9 --- /dev/null +++ b/model-00103-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887531f7c25c27e14f20a49c2b27cd8c8ddb244eb74f427ef83c72d9e77ebb9a +size 5365147656 diff --git a/model-00104-of-00132.safetensors b/model-00104-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..251bbb980e59fefdcecdeb02cda21fbf5e018acf --- /dev/null +++ b/model-00104-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc1ce34f63071bb42f922b877855c3ce94fd0439d91ec95df579cfc3087c0399 +size 5363538392 diff --git a/model-00105-of-00132.safetensors b/model-00105-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a282123cf59d0e4cfbd9a6f3e79b2b1116b73ae1 --- /dev/null +++ b/model-00105-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa54cf7104dab352eb8272a2af7865bbf98befecc96c9b1ca7b92de78e21397e +size 5363508960 diff --git a/model-00106-of-00132.safetensors b/model-00106-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f36fbd02adca3059860ed66c44b4004f5b2aff24 --- /dev/null +++ b/model-00106-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c85f4f983e3d5fb811ffa8903c2e4089019ec516883b8f8eed8cd282cb6c3f +size 5365147640 diff --git a/model-00107-of-00132.safetensors b/model-00107-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea0f8c34a47eeba6e023d9ac6dde5bf35a1c8d43 --- /dev/null +++ 
b/model-00107-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e820646335f567fda6e952ef59cc57b2f0368fb38b33c6ca2a5bf9b6835f4de +size 5363538344 diff --git a/model-00108-of-00132.safetensors b/model-00108-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f39badbd510b3a0eb90bee1fa2fb741573b95feb --- /dev/null +++ b/model-00108-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:352ac295287df943584abc0548821ad922ffaf5f276053199d07b6d5bfb6961b +size 5363509064 diff --git a/model-00109-of-00132.safetensors b/model-00109-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00037a6c81a72d4525c6d7ed696de751740c629a --- /dev/null +++ b/model-00109-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15180a03e8ff5857e15e7ed135b2e21d99c417aafb78f27490489d6f6d1fcef8 +size 5365147576 diff --git a/model-00110-of-00132.safetensors b/model-00110-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..338d0fa1461b6d95bbf629cec3637f3489724de7 --- /dev/null +++ b/model-00110-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f54852265e41bd51e757f177347425629f71b1bb269bd85a76d31a1626e3cb9 +size 5363538304 diff --git a/model-00111-of-00132.safetensors b/model-00111-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca7741eac2ada1add6366772ee736d4b18b1e67c --- /dev/null +++ b/model-00111-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbf34540c73c0ce7c0d188aa07a4bf61bc0be53f6796908ac9ebea070901d6a +size 5365147792 diff --git a/model-00112-of-00132.safetensors b/model-00112-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86e9da01e81134a4ffbbd39faa7b05be3f2537e6 --- /dev/null +++ 
b/model-00112-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b558d2a4eb39c28732a70a992e5ed90903fe81bf96718edfe314953003d4116 +size 5363508904 diff --git a/model-00113-of-00132.safetensors b/model-00113-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..762f9d9a6e8b867673cc462a3fabd898e672b62e --- /dev/null +++ b/model-00113-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04f0d3ab4759c30dd9feab23abef6a5fb4fb68e90ca5e2b749828d85aecada9 +size 5353051632 diff --git a/model-00114-of-00132.safetensors b/model-00114-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d8e64d34c39fc87688dea3231df092862786cee --- /dev/null +++ b/model-00114-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4071546e482206984fa8bd4c11a56a767ad74d35f6508395904f698b438cc3 +size 5365147760 diff --git a/model-00115-of-00132.safetensors b/model-00115-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..035beda0c5d79e5d945374c244230ed7f06a9535 --- /dev/null +++ b/model-00115-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0d2d96842e1038521153c2103921223fbe350ec7cf346dd2c246a6e35bc88a +size 5363508944 diff --git a/model-00116-of-00132.safetensors b/model-00116-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2d9a9d600fc8e5f10f53d041d38944569fd3330 --- /dev/null +++ b/model-00116-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a388038af4c973a51c43bcee418085c4f0bc42b809c3c9e366e4e406580cede1 +size 5353051632 diff --git a/model-00117-of-00132.safetensors b/model-00117-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9fd31681346cffc3558744e67c24a162f055f3cd --- /dev/null +++ 
b/model-00117-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4502fdc863c106d15857299459fc2a286f6c8f855370a766f30f00555997b0b6 +size 5365147720 diff --git a/model-00118-of-00132.safetensors b/model-00118-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d48e071b7d3c4d6a149da06717ae2c5154022328 --- /dev/null +++ b/model-00118-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea12e0c84743b981cf7bed310ea43ec34ac5077ac6dbbab5b76bc4301a086528 +size 5363509024 diff --git a/model-00119-of-00132.safetensors b/model-00119-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6392e6d358ddd12f0182f7eb7ea1258388a1e4c0 --- /dev/null +++ b/model-00119-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d84ba893f42a39db8d4f4a726564ec3b3f3d0b97cceb40b7afb5d1bddcdc07f +size 5353061936 diff --git a/model-00120-of-00132.safetensors b/model-00120-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd3f1815fc86c1be9a06093ec90b11cf0bb1ab9b --- /dev/null +++ b/model-00120-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3b6906f239951274b434a7cc8b91a0e56aaa223644e42057904db318797c76 +size 5365158032 diff --git a/model-00121-of-00132.safetensors b/model-00121-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bbe48ed32a1113a08a3139559510b3d6b62e7d3 --- /dev/null +++ b/model-00121-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876f88f7b3be1276c6882054ee0a8c0275509fb498aec27e232d766367ea5c26 +size 5353062136 diff --git a/model-00122-of-00132.safetensors b/model-00122-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e2a9a4a857ae4d9ddcae544e37778361f4d24e7 --- /dev/null +++ 
b/model-00122-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ff644259bf2941bb144a0f3b55601621410bb8d4502c71cc22f4a8a6862b51 +size 5363508864 diff --git a/model-00123-of-00132.safetensors b/model-00123-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03c13614b75fa4cb1d94166b9f236041dd8695e9 --- /dev/null +++ b/model-00123-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c61e555b177ab7d79254b140d3d2f326ebac9963822d3f81b38dc6ce4cb7ca +size 5365158000 diff --git a/model-00124-of-00132.safetensors b/model-00124-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91fd50616db452615e9a65cc7865596e118f9fba --- /dev/null +++ b/model-00124-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549a8d5d9c457f7eaab2c5a84432c18490cf75344daa43cce5987b947c1fd30f +size 5353062120 diff --git a/model-00125-of-00132.safetensors b/model-00125-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b275c252388ec94f6c84610f07221d9cbec2e0f0 --- /dev/null +++ b/model-00125-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc8cfb4edde239d38ee72d2539fecd6f53b43b9e37c63e41617227d3f577507 +size 5363508912 diff --git a/model-00126-of-00132.safetensors b/model-00126-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7723bb3546db9d07daea45b38d9b78b344cd74b4 --- /dev/null +++ b/model-00126-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5de838b5f537a76685801a2626780910dfb6715f7b09356e051ef86fde26cc +size 5365158000 diff --git a/model-00127-of-00132.safetensors b/model-00127-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4eff7cc6cd6439f3ee6d60dfbf98e627c9652f68 --- /dev/null +++ 
b/model-00127-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a87a2a1ef862dacb26a76b18677b9e0b91bd722919d5370cb9361283d962588 +size 5353062080 diff --git a/model-00128-of-00132.safetensors b/model-00128-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fdd3c39830a7470ec88768c15eeab0b88320547 --- /dev/null +++ b/model-00128-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:426a25e514a80d91ad3b1ab852fe55ebf3931c4cc22438a0f235ec4dbba9aee4 +size 5363508960 diff --git a/model-00129-of-00132.safetensors b/model-00129-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..974915dc3e3f6ec2e044b6c5f9ed84420cc455ac --- /dev/null +++ b/model-00129-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:969ea268c097b13478612ff39c920a1df970cf55032fc57835b50d56aaecc4d0 +size 5365157992 diff --git a/model-00130-of-00132.safetensors b/model-00130-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e5b0ce66432f421d2d1362797c620e8631aa3b9 --- /dev/null +++ b/model-00130-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1603932d7b39498887b0e69bb948c219a34d3b20a0ce30f07fc85787e72e8b1e +size 5345949928 diff --git a/model-00131-of-00132.safetensors b/model-00131-of-00132.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6fa978c15f520904b80aa562df6ac10f77c8cae --- /dev/null +++ b/model-00131-of-00132.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46263ecb3ad26f3f544ba45addd95319b19852ffdab1125f6f9ed5355dd2ae87 +size 3487825680 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..20a01b5c246c7e1f82f8b1dafb4685680c3f8b8c --- /dev/null +++ 
b/model.safetensors.index.json @@ -0,0 +1,44196 @@ +{ + "metadata": { + "total_size": 705595686528 + }, + "weight_map": { + "model.embed_tokens.weight": "model-00000-of-00132.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00000-of-00132.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00000-of-00132.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00000-of-00132.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00000-of-00132.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00000-of-00132.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00000-of-00132.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00000-of-00132.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.self_attn.q_proj.bias": 
"model-00000-of-00132.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00000-of-00132.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00000-of-00132.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00000-of-00132.safetensors", + 
"model.layers.3.mlp.experts.9.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00000-of-00132.safetensors", + 
"model.layers.3.mlp.experts.21.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00000-of-00132.safetensors", 
+ "model.layers.3.mlp.experts.32.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00000-of-00132.safetensors", 
+ "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": 
"model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": 
"model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00000-of-00132.safetensors", + 
"model.layers.3.mlp.experts.78.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00000-of-00132.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00001-of-00132.safetensors", 
+ "model.layers.3.mlp.experts.89.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.112.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.134.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.157.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.39.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.84.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": 
"model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.129.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.3.mlp.experts.151.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00132.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.gate.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00001-of-00132.safetensors", + 
"model.layers.4.mlp.experts.2.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00001-of-00132.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.13.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.25.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00002-of-00132.safetensors", 
+ "model.layers.4.mlp.experts.36.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00002-of-00132.safetensors", 
+ "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.82.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00002-of-00132.safetensors", 
+ "model.layers.4.mlp.experts.93.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.116.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.138.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00002-of-00132.safetensors", + 
"model.layers.4.mlp.experts.2.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": 
"model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00002-of-00132.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.4.mlp.experts.47.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": 
"model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.4.mlp.experts.92.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.4.mlp.experts.114.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.4.mlp.experts.136.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.4.mlp.experts.158.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00003-of-00132.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00003-of-00132.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00003-of-00132.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00003-of-00132.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.5.mlp.experts.6.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.5.mlp.experts.18.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00003-of-00132.safetensors", 
+ "model.layers.5.mlp.experts.29.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00003-of-00132.safetensors", 
+ "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": 
"model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": 
"model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00003-of-00132.safetensors", + 
"model.layers.5.mlp.experts.75.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00003-of-00132.safetensors", 
+ "model.layers.5.mlp.experts.86.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00003-of-00132.safetensors", 
+ "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00003-of-00132.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.120.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.143.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.11.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.56.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.101.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.123.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00004-of-00132.safetensors", + 
"model.layers.5.mlp.experts.145.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00004-of-00132.safetensors", + "model.layers.6.post_attention_layernorm.weight": 
"model-00004-of-00132.safetensors", + "model.layers.6.mlp.gate.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": 
"model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00004-of-00132.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.33.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00005-of-00132.safetensors", 
+ "model.layers.6.mlp.experts.44.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00005-of-00132.safetensors", 
+ "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.90.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.112.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.135.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.157.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00005-of-00132.safetensors", + 
"model.layers.6.mlp.experts.40.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": 
"model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00005-of-00132.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.6.mlp.experts.85.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": 
"model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.6.mlp.experts.130.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.6.mlp.experts.152.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00006-of-00132.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00006-of-00132.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00006-of-00132.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00006-of-00132.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.7.mlp.experts.3.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.7.mlp.experts.15.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00006-of-00132.safetensors", 
+ "model.layers.7.mlp.experts.26.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00006-of-00132.safetensors", 
+ "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": 
"model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": 
"model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.7.mlp.experts.72.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00006-of-00132.safetensors", 
+ "model.layers.7.mlp.experts.83.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00006-of-00132.safetensors", 
+ "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": 
"model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00006-of-00132.safetensors", + 
"model.layers.7.mlp.experts.117.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00006-of-00132.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.140.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.5.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.50.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.95.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.117.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.experts.139.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.7.mlp.shared_experts.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00007-of-00132.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.gate.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": 
"model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00007-of-00132.safetensors", + 
"model.layers.8.mlp.experts.30.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00007-of-00132.safetensors", 
+ "model.layers.8.mlp.experts.41.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00007-of-00132.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00008-of-00132.safetensors", 
+ "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.87.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00008-of-00132.safetensors", 
+ "model.layers.8.mlp.experts.98.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.121.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.143.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.12.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.57.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": 
"model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00008-of-00132.safetensors", + 
"model.layers.8.mlp.experts.102.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00008-of-00132.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.8.mlp.experts.124.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.8.mlp.experts.146.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00009-of-00132.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00009-of-00132.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00009-of-00132.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00009-of-00132.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.9.mlp.experts.23.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00009-of-00132.safetensors", 
+ "model.layers.9.mlp.experts.34.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00009-of-00132.safetensors", 
+ "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.9.mlp.experts.80.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00009-of-00132.safetensors", 
+ "model.layers.9.mlp.experts.91.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.9.mlp.experts.114.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": 
"model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00009-of-00132.safetensors", + 
"model.layers.9.mlp.experts.136.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00009-of-00132.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.9.mlp.experts.159.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.9.mlp.experts.43.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.9.mlp.experts.88.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.9.mlp.experts.133.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.9.mlp.experts.155.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00010-of-00132.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00010-of-00132.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00010-of-00132.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00010-of-00132.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.gate.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.10.mlp.experts.4.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.10.mlp.experts.27.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00010-of-00132.safetensors", + 
"model.layers.10.mlp.experts.49.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": 
"model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00010-of-00132.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": 
"model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": 
"model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.128.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.139.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.150.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.2.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.24.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.46.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.68.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.90.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.112.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.134.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00011-of-00132.safetensors", + 
"model.layers.10.mlp.experts.156.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00011-of-00132.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00012-of-00132.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": 
"model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": 
"model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": 
"model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": 
"model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": 
"model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.130.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.141.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.152.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00012-of-00132.safetensors", + 
"model.layers.11.mlp.experts.6.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00012-of-00132.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.28.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.50.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.72.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.94.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.116.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.experts.138.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00013-of-00132.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00013-of-00132.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00013-of-00132.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00013-of-00132.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.gate.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": 
"model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": 
"model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": 
"model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00132.safetensors", + 
"model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": 
"model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00132.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.97.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.108.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.119.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.130.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.141.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.152.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.6.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.28.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.50.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.72.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.94.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.116.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.experts.138.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00014-of-00132.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": 
"model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00132.safetensors", + 
"model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00132.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": 
"model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.42.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": 
"model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.65.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": 
"model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.87.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": 
"model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.110.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.121.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.132.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.143.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.154.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": 
"model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.33.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00015-of-00132.safetensors", + 
"model.layers.13.mlp.experts.55.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00015-of-00132.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.13.mlp.experts.77.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.13.mlp.experts.99.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.13.mlp.experts.121.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.13.mlp.experts.143.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00016-of-00132.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00016-of-00132.safetensors", + "model.layers.14.self_attn.v_proj.bias": 
"model-00016-of-00132.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00016-of-00132.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.gate.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": 
"model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.14.mlp.experts.21.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": 
"model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.14.mlp.experts.43.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": 
"model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.14.mlp.experts.66.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": 
"model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.14.mlp.experts.88.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": 
"model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00016-of-00132.safetensors", + 
"model.layers.14.mlp.experts.111.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00016-of-00132.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.122.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.133.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.144.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.155.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": 
"model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.35.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.57.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.79.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.101.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.123.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.14.mlp.experts.145.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00017-of-00132.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.15.mlp.experts.1.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": 
"model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.15.mlp.experts.23.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": 
"model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00017-of-00132.safetensors", + 
"model.layers.15.mlp.experts.46.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00017-of-00132.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": 
"model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.68.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": 
"model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.91.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": 
"model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.113.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.124.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.135.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.146.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.157.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": 
"model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.40.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.62.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.84.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00018-of-00132.safetensors", + 
"model.layers.15.mlp.experts.106.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00018-of-00132.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.15.mlp.experts.128.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.15.mlp.experts.150.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00019-of-00132.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00019-of-00132.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00019-of-00132.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00019-of-00132.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.gate.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.1.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": 
"model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.24.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": 
"model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.46.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": 
"model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.69.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": 
"model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.91.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": 
"model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.114.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.125.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00019-of-00132.safetensors", + 
"model.layers.16.mlp.experts.136.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00019-of-00132.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.147.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.158.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": 
"model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.41.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.63.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.85.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.107.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.129.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.16.mlp.experts.151.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00020-of-00132.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.17.mlp.experts.4.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": 
"model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.17.mlp.experts.26.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": 
"model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.17.mlp.experts.49.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": 
"model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00020-of-00132.safetensors", + 
"model.layers.17.mlp.experts.71.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00020-of-00132.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": 
"model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.94.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": 
"model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.116.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.127.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.138.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.149.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.1.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": 
"model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.46.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.68.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.90.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.112.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.134.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00021-of-00132.safetensors", + 
"model.layers.17.mlp.experts.156.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00021-of-00132.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00021-of-00132.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00021-of-00132.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00021-of-00132.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00021-of-00132.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00021-of-00132.safetensors", + "model.layers.18.mlp.gate.weight": "model-00021-of-00132.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00021-of-00132.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.4.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": 
"model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.27.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": 
"model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.49.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": 
"model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.72.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": 
"model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.94.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": 
"model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.117.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.128.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.139.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.150.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00022-of-00132.safetensors", + 
"model.layers.18.mlp.experts.2.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00022-of-00132.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.24.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.46.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.68.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.90.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.112.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.134.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.18.mlp.experts.156.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00023-of-00132.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": 
"model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.19.mlp.experts.16.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": 
"model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.19.mlp.experts.39.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": 
"model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.19.mlp.experts.61.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": 
"model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00023-of-00132.safetensors", + 
"model.layers.19.mlp.experts.84.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00023-of-00132.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": 
"model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.106.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.117.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.128.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.139.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.150.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.3.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.25.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.47.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.69.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.91.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.113.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.135.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.19.mlp.experts.157.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00024-of-00132.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.gate.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00024-of-00132.safetensors", + 
"model.layers.20.mlp.experts.5.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00024-of-00132.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": 
"model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.27.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": 
"model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.50.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": 
"model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.72.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": 
"model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.95.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": 
"model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.117.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.128.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.139.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.150.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.3.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.25.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00025-of-00132.safetensors", + 
"model.layers.20.mlp.experts.47.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00025-of-00132.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.20.mlp.experts.69.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.20.mlp.experts.91.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.20.mlp.experts.113.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.20.mlp.experts.135.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.20.mlp.experts.157.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00026-of-00132.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00026-of-00132.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00026-of-00132.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00026-of-00132.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.6.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": 
"model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.28.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": 
"model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.51.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": 
"model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.73.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": 
"model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.96.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00026-of-00132.safetensors", + 
"model.layers.21.mlp.experts.107.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00026-of-00132.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.118.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.129.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.140.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.151.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.4.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.26.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.48.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.70.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.92.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.114.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.136.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.21.mlp.experts.158.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00027-of-00132.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.gate.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.22.mlp.experts.5.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": 
"model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00027-of-00132.safetensors", + 
"model.layers.22.mlp.experts.28.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00027-of-00132.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": 
"model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.50.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": 
"model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.73.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": 
"model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.95.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": 
"model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.118.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.129.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.140.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.151.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.4.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.26.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.48.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00028-of-00132.safetensors", + 
"model.layers.22.mlp.experts.70.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00028-of-00132.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00029-of-00132.safetensors", + 
"model.layers.22.mlp.experts.92.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00029-of-00132.safetensors", + 
"model.layers.22.mlp.experts.114.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00029-of-00132.safetensors", + 
"model.layers.22.mlp.experts.136.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00029-of-00132.safetensors", + 
"model.layers.22.mlp.experts.158.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.0.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.1.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.2.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + 
"model.layers.2.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.3.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.3.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.4.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.5.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.5.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.6.input_layernorm.weight": 
"model-00029-of-00132.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.7.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.7.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.8.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.9.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.9.mlp.gate.weight": 
"model-00029-of-00132.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.10.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.11.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.11.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.12.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.12.self_attn.v_proj.weight": 
"model-00029-of-00132.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.13.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.13.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.14.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.15.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.k_proj.weight": 
"model-00029-of-00132.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.15.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.16.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.17.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.17.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + 
"model.layers.17.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.18.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.19.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.19.mlp.gate.weight": "model-00029-of-00132.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00029-of-00132.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.20.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00029-of-00132.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00029-of-00132.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00029-of-00132.safetensors", + "model.layers.21.input_layernorm.weight": "model-00029-of-00132.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.21.self_attn.v_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00030-of-00132.safetensors", + "model.layers.21.mlp.gate.weight": "model-00030-of-00132.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00030-of-00132.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.22.input_layernorm.weight": "model-00030-of-00132.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00030-of-00132.safetensors", + "model.layers.23.input_layernorm.weight": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00030-of-00132.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00030-of-00132.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.13.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.35.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.58.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.80.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": 
"model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.103.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.114.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.125.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.136.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.147.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00030-of-00132.safetensors", + 
"model.layers.23.mlp.experts.158.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00030-of-00132.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": 
"model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.41.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.63.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.85.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.107.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.129.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.23.mlp.experts.151.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.input_layernorm.weight": "model-00031-of-00132.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00031-of-00132.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00031-of-00132.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00031-of-00132.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00031-of-00132.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00031-of-00132.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.gate.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.24.mlp.experts.2.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": 
"model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.24.mlp.experts.24.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": 
"model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.24.mlp.experts.47.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": 
"model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00031-of-00132.safetensors", + 
"model.layers.24.mlp.experts.69.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": 
"model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00031-of-00132.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.92.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": 
"model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.114.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.125.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.136.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.147.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.158.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": 
"model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.42.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.64.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.86.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.108.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.130.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.24.mlp.experts.152.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.input_layernorm.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00032-of-00132.safetensors", + "model.layers.25.self_attn.k_norm.weight": "model-00032-of-00132.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00032-of-00132.safetensors", + 
"model.layers.25.mlp.experts.0.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00032-of-00132.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.23.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.45.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.68.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.90.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.113.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.124.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.135.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.146.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.157.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": 
"model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00033-of-00132.safetensors", + 
"model.layers.25.mlp.experts.39.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00033-of-00132.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.25.mlp.experts.61.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.25.mlp.experts.83.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.25.mlp.experts.105.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.25.mlp.experts.127.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.25.mlp.experts.149.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.input_layernorm.weight": "model-00034-of-00132.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00034-of-00132.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00034-of-00132.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00034-of-00132.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00034-of-00132.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00034-of-00132.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.gate.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00034-of-00132.safetensors", + 
"model.layers.26.mlp.experts.0.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": 
"model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.26.mlp.experts.22.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": 
"model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.26.mlp.experts.45.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": 
"model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.26.mlp.experts.67.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": 
"model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00034-of-00132.safetensors", + 
"model.layers.26.mlp.experts.90.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": 
"model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00034-of-00132.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.112.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.123.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.134.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.145.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.156.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": 
"model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.38.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.60.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.82.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.104.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.126.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.26.mlp.experts.148.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.input_layernorm.weight": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00035-of-00132.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00035-of-00132.safetensors", + 
"model.layers.27.self_attn.k_norm.weight": "model-00035-of-00132.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00035-of-00132.safetensors", + 
"model.layers.27.mlp.experts.10.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": 
"model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00035-of-00132.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.32.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": 
"model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.55.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": 
"model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.77.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": 
"model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.100.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.111.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.122.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.133.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.144.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.155.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": 
"model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.35.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.57.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00036-of-00132.safetensors", + 
"model.layers.27.mlp.experts.79.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00036-of-00132.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.27.mlp.experts.101.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.27.mlp.experts.123.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.27.mlp.experts.145.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.input_layernorm.weight": "model-00037-of-00132.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00037-of-00132.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00037-of-00132.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00037-of-00132.safetensors", + "model.layers.28.self_attn.q_norm.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00037-of-00132.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.gate.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.20.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.43.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.65.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.88.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": 
"model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.110.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00037-of-00132.safetensors", + 
"model.layers.28.mlp.experts.121.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00037-of-00132.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.132.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.143.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.154.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": 
"model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.34.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.56.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.78.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.100.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.122.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.28.mlp.experts.144.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.input_layernorm.weight": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.v_proj.weight": 
"model-00038-of-00132.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00038-of-00132.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00038-of-00132.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": 
"model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.29.mlp.experts.19.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": 
"model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00038-of-00132.safetensors", + 
"model.layers.29.mlp.experts.41.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00038-of-00132.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": 
"model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.64.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": 
"model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.86.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": 
"model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.109.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.120.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.131.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.142.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.153.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": 
"model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.31.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.53.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.75.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.97.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00039-of-00132.safetensors", + 
"model.layers.29.mlp.experts.119.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00039-of-00132.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.29.mlp.experts.141.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.input_layernorm.weight": "model-00040-of-00132.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00040-of-00132.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00040-of-00132.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00040-of-00132.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00040-of-00132.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00040-of-00132.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.gate.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": 
"model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.18.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": 
"model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.41.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": 
"model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.63.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": 
"model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.86.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": 
"model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.108.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.119.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.130.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00040-of-00132.safetensors", + 
"model.layers.30.mlp.experts.141.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00040-of-00132.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.152.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": 
"model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.30.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.52.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.74.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.96.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.118.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.30.mlp.experts.140.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.31.self_attn.o_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.input_layernorm.weight": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00041-of-00132.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00041-of-00132.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": 
"model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.31.mlp.experts.17.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": 
"model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.31.mlp.experts.39.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": 
"model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00041-of-00132.safetensors", + 
"model.layers.31.mlp.experts.62.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00041-of-00132.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": 
"model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.84.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": 
"model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.107.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.118.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.129.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.140.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.151.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.4.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.26.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.48.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.70.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.92.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.114.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.136.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00042-of-00132.safetensors", + 
"model.layers.31.mlp.experts.158.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00042-of-00132.safetensors", + "model.layers.32.input_layernorm.weight": "model-00042-of-00132.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00042-of-00132.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00042-of-00132.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00042-of-00132.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00042-of-00132.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00042-of-00132.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00042-of-00132.safetensors", + "model.layers.32.mlp.gate.weight": "model-00042-of-00132.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00042-of-00132.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.4.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": 
"model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.27.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": 
"model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.49.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": 
"model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.72.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": 
"model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.94.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": 
"model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.117.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.128.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.139.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.150.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00043-of-00132.safetensors", + 
"model.layers.32.mlp.experts.2.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00043-of-00132.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.24.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.46.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.68.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.90.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.112.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.134.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.32.mlp.experts.156.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.input_layernorm.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00044-of-00132.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00044-of-00132.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.33.mlp.experts.2.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": 
"model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.33.mlp.experts.25.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": 
"model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.33.mlp.experts.47.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": 
"model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00044-of-00132.safetensors", + 
"model.layers.33.mlp.experts.70.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": 
"model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00044-of-00132.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.92.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": 
"model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.115.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.126.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.137.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.148.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.159.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": 
"model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.43.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.65.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.87.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.109.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.131.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.33.mlp.experts.153.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.input_layernorm.weight": "model-00045-of-00132.safetensors", + "model.layers.34.self_attn.q_proj.bias": "model-00045-of-00132.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00045-of-00132.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00045-of-00132.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00045-of-00132.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00045-of-00132.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.gate.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00045-of-00132.safetensors", + 
"model.layers.34.mlp.experts.2.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": 
"model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00045-of-00132.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.24.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": 
"model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.47.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": 
"model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.69.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": 
"model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.92.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": 
"model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.114.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.125.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.136.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.147.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.158.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": 
"model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00046-of-00132.safetensors", + 
"model.layers.34.mlp.experts.42.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00046-of-00132.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.34.mlp.experts.64.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.34.mlp.experts.86.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.34.mlp.experts.108.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.34.mlp.experts.130.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.34.mlp.experts.152.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.input_layernorm.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00047-of-00132.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00047-of-00132.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.35.mlp.experts.0.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": 
"model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.35.mlp.experts.23.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": 
"model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.35.mlp.experts.45.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": 
"model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.35.mlp.experts.68.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": 
"model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00047-of-00132.safetensors", + 
"model.layers.35.mlp.experts.90.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": 
"model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00047-of-00132.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.113.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.124.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.135.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.146.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.157.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": 
"model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.39.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.61.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.83.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.105.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.127.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.35.mlp.experts.149.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.input_layernorm.weight": "model-00048-of-00132.safetensors", + "model.layers.36.self_attn.q_proj.bias": "model-00048-of-00132.safetensors", + "model.layers.36.self_attn.k_proj.bias": "model-00048-of-00132.safetensors", + "model.layers.36.self_attn.v_proj.bias": "model-00048-of-00132.safetensors", + "model.layers.36.self_attn.q_norm.weight": "model-00048-of-00132.safetensors", + "model.layers.36.self_attn.k_norm.weight": "model-00048-of-00132.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.gate.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00048-of-00132.safetensors", + 
"model.layers.36.mlp.experts.0.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": 
"model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00048-of-00132.safetensors", + 
"model.layers.36.mlp.experts.22.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": 
"model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00048-of-00132.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.45.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": 
"model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.67.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": 
"model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.90.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": 
"model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.112.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.123.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.134.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.145.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.156.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": 
"model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.38.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.60.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00049-of-00132.safetensors", + 
"model.layers.36.mlp.experts.82.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00049-of-00132.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.36.mlp.experts.104.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.36.mlp.experts.126.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.36.mlp.experts.148.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.input_layernorm.weight": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.q_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.k_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.v_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.q_proj.bias": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.k_proj.bias": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.v_proj.bias": "model-00050-of-00132.safetensors", + "model.layers.37.self_attn.q_norm.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.self_attn.k_norm.weight": "model-00050-of-00132.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.10.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": 
"model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.32.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": 
"model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.55.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": 
"model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.77.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": 
"model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.100.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.111.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00050-of-00132.safetensors", + 
"model.layers.37.mlp.experts.122.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00050-of-00132.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.133.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.144.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.155.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": 
"model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.35.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.57.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.79.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.101.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.123.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.37.mlp.experts.145.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.input_layernorm.weight": "model-00051-of-00132.safetensors", + "model.layers.38.self_attn.q_proj.bias": "model-00051-of-00132.safetensors", + "model.layers.38.self_attn.k_proj.bias": "model-00051-of-00132.safetensors", + "model.layers.38.self_attn.v_proj.bias": "model-00051-of-00132.safetensors", + "model.layers.38.self_attn.q_norm.weight": 
"model-00051-of-00132.safetensors", + "model.layers.38.self_attn.k_norm.weight": "model-00051-of-00132.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.gate.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": 
"model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.38.mlp.experts.20.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": 
"model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00051-of-00132.safetensors", + 
"model.layers.38.mlp.experts.43.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": 
"model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00051-of-00132.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.65.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": 
"model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.88.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": 
"model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.110.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.121.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.132.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.143.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.154.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": 
"model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.34.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.56.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.78.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.100.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00052-of-00132.safetensors", + 
"model.layers.38.mlp.experts.122.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00052-of-00132.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.38.mlp.experts.144.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.input_layernorm.weight": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.q_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.k_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.v_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.self_attn.q_proj.bias": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.k_proj.bias": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.v_proj.bias": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.q_norm.weight": "model-00053-of-00132.safetensors", + "model.layers.39.self_attn.k_norm.weight": "model-00053-of-00132.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.19.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.41.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.64.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.86.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": 
"model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.109.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.120.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.131.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00053-of-00132.safetensors", + 
"model.layers.39.mlp.experts.142.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00053-of-00132.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.153.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": 
"model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.31.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.53.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.75.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.97.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.119.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.39.mlp.experts.141.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.40.input_layernorm.weight": "model-00054-of-00132.safetensors", + "model.layers.40.self_attn.q_proj.bias": "model-00054-of-00132.safetensors", + "model.layers.40.self_attn.k_proj.bias": "model-00054-of-00132.safetensors", + "model.layers.40.self_attn.v_proj.bias": "model-00054-of-00132.safetensors", + "model.layers.40.self_attn.q_norm.weight": "model-00054-of-00132.safetensors", + "model.layers.40.self_attn.k_norm.weight": "model-00054-of-00132.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.gate.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": 
"model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.40.mlp.experts.18.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": 
"model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.40.mlp.experts.41.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": 
"model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00054-of-00132.safetensors", + 
"model.layers.40.mlp.experts.63.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": 
"model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00054-of-00132.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.86.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": 
"model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.108.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.119.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.130.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.141.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.152.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": 
"model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.30.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.52.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.74.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.96.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.118.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.40.mlp.experts.140.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00055-of-00132.safetensors", + 
"model.layers.41.self_attn.o_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.41.input_layernorm.weight": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.q_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.k_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.v_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.q_proj.bias": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.k_proj.bias": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.v_proj.bias": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.q_norm.weight": "model-00055-of-00132.safetensors", + "model.layers.41.self_attn.k_norm.weight": "model-00055-of-00132.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00055-of-00132.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00055-of-00132.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00055-of-00132.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": 
"model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.17.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": 
"model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.39.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": 
"model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.62.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": 
"model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.84.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": 
"model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.107.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.118.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.129.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.140.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.151.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00056-of-00132.safetensors", + 
"model.layers.41.mlp.experts.4.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00056-of-00132.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.26.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.48.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.70.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.92.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.114.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.136.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.41.mlp.experts.158.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.input_layernorm.weight": "model-00057-of-00132.safetensors", + "model.layers.42.self_attn.q_proj.bias": "model-00057-of-00132.safetensors", + "model.layers.42.self_attn.k_proj.bias": "model-00057-of-00132.safetensors", + "model.layers.42.self_attn.v_proj.bias": "model-00057-of-00132.safetensors", + "model.layers.42.self_attn.q_norm.weight": "model-00057-of-00132.safetensors", + "model.layers.42.self_attn.k_norm.weight": "model-00057-of-00132.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.gate.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.42.mlp.experts.4.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": 
"model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.42.mlp.experts.27.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": 
"model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.42.mlp.experts.49.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": 
"model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.42.mlp.experts.72.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": 
"model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00057-of-00132.safetensors", + 
"model.layers.42.mlp.experts.94.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00057-of-00132.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": 
"model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.117.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.128.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.139.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.150.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.2.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.24.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.46.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.68.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.90.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.112.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.134.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.42.mlp.experts.156.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.input_layernorm.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.q_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.k_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.v_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.q_proj.bias": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.k_proj.bias": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.v_proj.bias": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.q_norm.weight": "model-00058-of-00132.safetensors", + "model.layers.43.self_attn.k_norm.weight": "model-00058-of-00132.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00058-of-00132.safetensors", + 
"model.layers.43.mlp.experts.2.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": 
"model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00058-of-00132.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.25.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": 
"model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.47.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": 
"model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.70.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": 
"model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.92.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": 
"model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.115.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.126.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.137.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.148.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.159.gate_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": 
"model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00059-of-00132.safetensors", + 
"model.layers.43.mlp.experts.43.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00059-of-00132.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.43.mlp.experts.65.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.43.mlp.experts.87.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.43.mlp.experts.109.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.43.mlp.experts.131.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.43.mlp.experts.153.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.input_layernorm.weight": "model-00060-of-00132.safetensors", + "model.layers.44.self_attn.q_proj.bias": "model-00060-of-00132.safetensors", + "model.layers.44.self_attn.k_proj.bias": "model-00060-of-00132.safetensors", + "model.layers.44.self_attn.v_proj.bias": "model-00060-of-00132.safetensors", + "model.layers.44.self_attn.q_norm.weight": "model-00060-of-00132.safetensors", + "model.layers.44.self_attn.k_norm.weight": "model-00060-of-00132.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.gate.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.2.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": 
"model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.24.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": 
"model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.47.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": 
"model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.69.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": 
"model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.92.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": 
"model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00060-of-00132.safetensors", + 
"model.layers.44.mlp.experts.114.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00060-of-00132.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.125.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.136.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.147.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.158.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": 
"model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.42.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.64.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.86.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.108.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.130.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.44.mlp.experts.152.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.input_layernorm.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.q_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.k_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.v_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.q_proj.bias": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.k_proj.bias": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.v_proj.bias": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.q_norm.weight": "model-00061-of-00132.safetensors", + "model.layers.45.self_attn.k_norm.weight": "model-00061-of-00132.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.45.mlp.experts.0.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": 
"model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00061-of-00132.safetensors", + 
"model.layers.45.mlp.experts.23.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": 
"model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00061-of-00132.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.45.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": 
"model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.68.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": 
"model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.90.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": 
"model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.113.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.124.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.135.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.146.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.157.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": 
"model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.39.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.61.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00062-of-00132.safetensors", + 
"model.layers.45.mlp.experts.83.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00062-of-00132.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00063-of-00132.safetensors", + 
"model.layers.45.mlp.experts.105.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00063-of-00132.safetensors", + 
"model.layers.45.mlp.experts.127.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00063-of-00132.safetensors", + 
"model.layers.45.mlp.experts.149.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.23.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": 
"model-00063-of-00132.safetensors", + "model.layers.25.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.27.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.29.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.31.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + 
"model.layers.33.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.35.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.36.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.36.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.36.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.37.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.38.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.38.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.38.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.39.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.40.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.40.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.40.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.41.mlp.gate.weight": 
"model-00063-of-00132.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.42.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.42.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.42.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.43.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.44.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.44.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.44.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.45.mlp.gate.weight": "model-00063-of-00132.safetensors", + "model.layers.46.input_layernorm.weight": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.q_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.k_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.v_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.q_proj.bias": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.k_proj.bias": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.v_proj.bias": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.q_norm.weight": "model-00063-of-00132.safetensors", + "model.layers.46.self_attn.k_norm.weight": "model-00063-of-00132.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": 
"model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00063-of-00132.safetensors", + 
"model.layers.46.mlp.experts.11.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": 
"model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00063-of-00132.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.34.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": 
"model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.56.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": 
"model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.79.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": 
"model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.101.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.112.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.123.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.134.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.145.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.156.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": 
"model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.38.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00064-of-00132.safetensors", + 
"model.layers.46.mlp.experts.60.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00064-of-00132.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.46.mlp.experts.82.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.46.mlp.experts.104.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.46.mlp.experts.126.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.46.mlp.experts.148.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.input_layernorm.weight": "model-00065-of-00132.safetensors", + "model.layers.47.self_attn.q_proj.bias": "model-00065-of-00132.safetensors", + "model.layers.47.self_attn.k_proj.bias": "model-00065-of-00132.safetensors", + "model.layers.47.self_attn.v_proj.bias": "model-00065-of-00132.safetensors", + "model.layers.47.self_attn.q_norm.weight": "model-00065-of-00132.safetensors", + "model.layers.47.self_attn.k_norm.weight": "model-00065-of-00132.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.gate.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.0.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": 
"model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.23.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": 
"model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.45.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": 
"model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.68.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": 
"model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.90.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": 
"model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.113.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00065-of-00132.safetensors", + 
"model.layers.47.mlp.experts.124.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00065-of-00132.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.135.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.146.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.157.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": 
"model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.39.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.61.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.83.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.105.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.127.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.47.mlp.experts.149.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.input_layernorm.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.q_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.k_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.v_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.q_proj.bias": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.k_proj.bias": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.v_proj.bias": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.q_norm.weight": "model-00066-of-00132.safetensors", + "model.layers.48.self_attn.k_norm.weight": "model-00066-of-00132.safetensors", + 
"model.layers.48.post_attention_layernorm.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": 
"model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.48.mlp.experts.21.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": 
"model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00066-of-00132.safetensors", + 
"model.layers.48.mlp.experts.44.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00066-of-00132.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": 
"model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.66.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": 
"model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.89.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": 
"model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.111.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.122.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.133.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.144.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.155.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": 
"model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.36.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.58.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.80.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00067-of-00132.safetensors", + 
"model.layers.48.mlp.experts.102.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00067-of-00132.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.48.mlp.experts.124.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.48.mlp.experts.146.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.input_layernorm.weight": "model-00068-of-00132.safetensors", + "model.layers.49.self_attn.q_proj.bias": "model-00068-of-00132.safetensors", + "model.layers.49.self_attn.k_proj.bias": "model-00068-of-00132.safetensors", + "model.layers.49.self_attn.v_proj.bias": "model-00068-of-00132.safetensors", + "model.layers.49.self_attn.q_norm.weight": "model-00068-of-00132.safetensors", + "model.layers.49.self_attn.k_norm.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.gate.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.21.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.43.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.66.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.88.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": 
"model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.111.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.122.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.133.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00068-of-00132.safetensors", + 
"model.layers.49.mlp.experts.144.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00068-of-00132.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.155.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": 
"model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.35.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.57.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.79.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.101.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.123.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.49.mlp.experts.145.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.input_layernorm.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.q_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.k_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.v_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.q_proj.bias": 
"model-00069-of-00132.safetensors", + "model.layers.50.self_attn.k_proj.bias": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.v_proj.bias": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.q_norm.weight": "model-00069-of-00132.safetensors", + "model.layers.50.self_attn.k_norm.weight": "model-00069-of-00132.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": 
"model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.50.mlp.experts.19.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": 
"model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.50.mlp.experts.42.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": 
"model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00069-of-00132.safetensors", + 
"model.layers.50.mlp.experts.64.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00069-of-00132.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": 
"model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.87.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": 
"model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.109.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.120.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.131.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.142.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.153.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": 
"model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.32.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.54.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.76.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.98.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.120.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00070-of-00132.safetensors", + 
"model.layers.50.mlp.experts.142.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00070-of-00132.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.input_layernorm.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.self_attn.q_proj.bias": "model-00071-of-00132.safetensors", + "model.layers.51.self_attn.k_proj.bias": "model-00071-of-00132.safetensors", + "model.layers.51.self_attn.v_proj.bias": "model-00071-of-00132.safetensors", + "model.layers.51.self_attn.q_norm.weight": "model-00071-of-00132.safetensors", + "model.layers.51.self_attn.k_norm.weight": "model-00071-of-00132.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.gate.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.7.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": 
"model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.30.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": 
"model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.52.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": 
"model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.75.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": 
"model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.97.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.108.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.119.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.130.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.141.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00071-of-00132.safetensors", + 
"model.layers.51.mlp.experts.152.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": 
"model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00071-of-00132.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.30.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.52.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.74.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.96.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.118.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.51.mlp.experts.140.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.52.self_attn.o_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.input_layernorm.weight": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.q_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.k_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.v_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.q_proj.bias": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.k_proj.bias": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.v_proj.bias": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.q_norm.weight": "model-00072-of-00132.safetensors", + "model.layers.52.self_attn.k_norm.weight": "model-00072-of-00132.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": 
"model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.52.mlp.experts.17.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": 
"model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.52.mlp.experts.39.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": 
"model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.52.mlp.experts.62.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": 
"model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00072-of-00132.safetensors", + 
"model.layers.52.mlp.experts.84.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00072-of-00132.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": 
"model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.107.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.118.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.129.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.140.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.151.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.4.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.26.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.48.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.70.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.92.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.114.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.136.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.52.mlp.experts.158.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.input_layernorm.weight": "model-00073-of-00132.safetensors", + "model.layers.53.self_attn.q_proj.bias": "model-00073-of-00132.safetensors", + "model.layers.53.self_attn.k_proj.bias": "model-00073-of-00132.safetensors", + "model.layers.53.self_attn.v_proj.bias": "model-00073-of-00132.safetensors", + "model.layers.53.self_attn.q_norm.weight": "model-00073-of-00132.safetensors", + "model.layers.53.self_attn.k_norm.weight": "model-00073-of-00132.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.gate.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00073-of-00132.safetensors", + 
"model.layers.53.mlp.experts.4.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": 
"model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00073-of-00132.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.27.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": 
"model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.49.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": 
"model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.72.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": 
"model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.94.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": 
"model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.117.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.128.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.139.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.150.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.2.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.24.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00074-of-00132.safetensors", + 
"model.layers.53.mlp.experts.46.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00074-of-00132.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.53.mlp.experts.68.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.53.mlp.experts.90.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.53.mlp.experts.112.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.53.mlp.experts.134.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.53.mlp.experts.156.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.input_layernorm.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.q_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.k_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.v_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.q_proj.bias": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.k_proj.bias": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.v_proj.bias": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.q_norm.weight": "model-00075-of-00132.safetensors", + "model.layers.54.self_attn.k_norm.weight": "model-00075-of-00132.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.54.mlp.experts.2.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": 
"model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.54.mlp.experts.25.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": 
"model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.54.mlp.experts.47.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": 
"model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.54.mlp.experts.70.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": 
"model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00075-of-00132.safetensors", + 
"model.layers.54.mlp.experts.92.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": 
"model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00075-of-00132.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.115.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.126.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.137.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.148.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.159.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": 
"model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.43.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.65.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.87.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.109.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.131.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.54.mlp.experts.153.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.input_layernorm.weight": "model-00076-of-00132.safetensors", + "model.layers.55.self_attn.q_proj.bias": "model-00076-of-00132.safetensors", + "model.layers.55.self_attn.k_proj.bias": "model-00076-of-00132.safetensors", + "model.layers.55.self_attn.v_proj.bias": "model-00076-of-00132.safetensors", + "model.layers.55.self_attn.q_norm.weight": "model-00076-of-00132.safetensors", + "model.layers.55.self_attn.k_norm.weight": "model-00076-of-00132.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.gate.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.55.mlp.experts.2.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": 
"model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00076-of-00132.safetensors", + 
"model.layers.55.mlp.experts.24.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": 
"model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00076-of-00132.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.47.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": 
"model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.69.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": 
"model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.92.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": 
"model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.114.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.125.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.136.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.147.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.158.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": 
"model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.42.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.64.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00077-of-00132.safetensors", + 
"model.layers.55.mlp.experts.86.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00077-of-00132.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.55.mlp.experts.108.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.55.mlp.experts.130.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.55.mlp.experts.152.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.input_layernorm.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.q_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.k_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.v_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.q_proj.bias": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.k_proj.bias": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.v_proj.bias": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.q_norm.weight": "model-00078-of-00132.safetensors", + "model.layers.56.self_attn.k_norm.weight": "model-00078-of-00132.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.0.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": 
"model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.23.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": 
"model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.45.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": 
"model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.68.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": 
"model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.90.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": 
"model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.113.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00078-of-00132.safetensors", + 
"model.layers.56.mlp.experts.124.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00078-of-00132.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.135.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.146.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.157.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": 
"model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.39.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.61.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.83.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.105.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.127.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.56.mlp.experts.149.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.input_layernorm.weight": "model-00079-of-00132.safetensors", + "model.layers.57.self_attn.q_proj.bias": "model-00079-of-00132.safetensors", + "model.layers.57.self_attn.k_proj.bias": "model-00079-of-00132.safetensors", + "model.layers.57.self_attn.v_proj.bias": "model-00079-of-00132.safetensors", + "model.layers.57.self_attn.q_norm.weight": "model-00079-of-00132.safetensors", + "model.layers.57.self_attn.k_norm.weight": "model-00079-of-00132.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.gate.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00079-of-00132.safetensors", + 
"model.layers.57.mlp.experts.0.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": 
"model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.57.mlp.experts.22.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": 
"model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00079-of-00132.safetensors", + 
"model.layers.57.mlp.experts.45.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": 
"model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00079-of-00132.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.67.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": 
"model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.90.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": 
"model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.112.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.123.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.134.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.145.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.156.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": 
"model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.38.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.60.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.82.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.104.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00080-of-00132.safetensors", + 
"model.layers.57.mlp.experts.126.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00080-of-00132.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.57.mlp.experts.148.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.input_layernorm.weight": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.q_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.k_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.v_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.q_proj.bias": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.k_proj.bias": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.v_proj.bias": "model-00081-of-00132.safetensors", + "model.layers.58.self_attn.q_norm.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.self_attn.k_norm.weight": "model-00081-of-00132.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.10.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": 
"model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.32.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": 
"model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.55.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": 
"model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.77.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": 
"model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.100.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.111.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.122.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.133.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00081-of-00132.safetensors", + 
"model.layers.58.mlp.experts.144.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00081-of-00132.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.155.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": 
"model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.35.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.57.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.79.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.101.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.123.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.58.mlp.experts.145.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.input_layernorm.weight": "model-00082-of-00132.safetensors", + "model.layers.59.self_attn.q_proj.bias": "model-00082-of-00132.safetensors", + "model.layers.59.self_attn.k_proj.bias": "model-00082-of-00132.safetensors", + "model.layers.59.self_attn.v_proj.bias": "model-00082-of-00132.safetensors", + "model.layers.59.self_attn.q_norm.weight": 
"model-00082-of-00132.safetensors", + "model.layers.59.self_attn.k_norm.weight": "model-00082-of-00132.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.gate.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": 
"model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.59.mlp.experts.20.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": 
"model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.59.mlp.experts.43.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": 
"model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00082-of-00132.safetensors", + 
"model.layers.59.mlp.experts.65.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": 
"model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00082-of-00132.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.88.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": 
"model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.110.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.121.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.132.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.143.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.154.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": 
"model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.34.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.56.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.78.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.100.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.122.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00083-of-00132.safetensors", + 
"model.layers.59.mlp.experts.144.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.60.input_layernorm.weight": "model-00083-of-00132.safetensors", + "model.layers.60.self_attn.q_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.60.self_attn.k_proj.weight": "model-00083-of-00132.safetensors", + "model.layers.60.self_attn.v_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.self_attn.q_proj.bias": "model-00084-of-00132.safetensors", + "model.layers.60.self_attn.k_proj.bias": "model-00084-of-00132.safetensors", + "model.layers.60.self_attn.v_proj.bias": "model-00084-of-00132.safetensors", + "model.layers.60.self_attn.q_norm.weight": "model-00084-of-00132.safetensors", + "model.layers.60.self_attn.k_norm.weight": "model-00084-of-00132.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.19.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.41.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.64.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.86.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.109.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.120.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.131.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.142.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00084-of-00132.safetensors", + 
"model.layers.60.mlp.experts.153.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": 
"model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00084-of-00132.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.31.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.53.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.75.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.97.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.119.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.60.mlp.experts.141.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.61.input_layernorm.weight": "model-00085-of-00132.safetensors", + "model.layers.61.self_attn.q_proj.bias": "model-00085-of-00132.safetensors", + "model.layers.61.self_attn.k_proj.bias": "model-00085-of-00132.safetensors", + "model.layers.61.self_attn.v_proj.bias": "model-00085-of-00132.safetensors", + "model.layers.61.self_attn.q_norm.weight": "model-00085-of-00132.safetensors", + "model.layers.61.self_attn.k_norm.weight": "model-00085-of-00132.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.gate.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": 
"model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.61.mlp.experts.18.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": 
"model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.61.mlp.experts.41.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": 
"model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.61.mlp.experts.63.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": 
"model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00085-of-00132.safetensors", + 
"model.layers.61.mlp.experts.86.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": 
"model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00085-of-00132.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.108.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.119.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.130.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.141.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.152.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": 
"model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.30.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.52.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.74.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.96.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.118.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.61.mlp.experts.140.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.62.self_attn.o_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.input_layernorm.weight": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.q_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.k_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.v_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.q_proj.bias": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.k_proj.bias": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.v_proj.bias": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.q_norm.weight": "model-00086-of-00132.safetensors", + "model.layers.62.self_attn.k_norm.weight": "model-00086-of-00132.safetensors", + "model.layers.62.post_attention_layernorm.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.gate.e_score_correction_bias": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.0.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.0.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.1.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.1.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.2.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.2.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.3.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.3.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.4.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.4.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.5.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.5.up_proj.weight": 
"model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.6.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.6.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.7.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.7.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.8.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.8.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.9.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.9.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.10.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.10.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.11.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.11.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.12.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.12.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.13.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.13.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.14.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.14.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.15.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.15.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.16.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.16.up_proj.weight": "model-00086-of-00132.safetensors", + 
"model.layers.62.mlp.experts.17.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.17.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.18.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.18.up_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.19.gate_proj.weight": "model-00086-of-00132.safetensors", + "model.layers.62.mlp.experts.19.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.20.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.20.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.21.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.21.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.22.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.22.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.23.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.23.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.24.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.24.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.25.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.25.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.26.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.26.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.27.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.27.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.28.gate_proj.weight": 
"model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.28.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.29.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.29.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.30.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.30.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.31.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.31.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.32.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.32.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.33.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.33.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.34.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.34.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.35.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.35.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.36.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.36.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.37.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.37.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.38.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.38.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.39.gate_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.39.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.40.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.40.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.41.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.41.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.42.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.42.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.43.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.43.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.44.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.44.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.45.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.45.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.46.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.46.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.47.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.47.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.48.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.48.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.49.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.49.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.50.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.50.up_proj.weight": 
"model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.51.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.51.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.52.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.52.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.53.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.53.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.54.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.54.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.55.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.55.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.56.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.56.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.57.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.57.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.58.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.58.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.59.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.59.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.60.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.60.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.61.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.61.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.62.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.62.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.63.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.63.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.64.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.64.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.65.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.65.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.66.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.66.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.67.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.67.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.68.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.68.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.69.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.69.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.70.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.70.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.71.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.71.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.72.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.72.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.73.gate_proj.weight": 
"model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.73.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.74.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.74.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.75.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.75.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.76.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.76.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.77.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.77.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.78.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.78.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.79.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.79.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.80.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.80.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.81.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.81.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.82.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.82.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.83.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.83.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.84.gate_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.84.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.85.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.85.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.86.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.86.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.87.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.87.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.88.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.88.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.89.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.89.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.90.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.90.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.91.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.91.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.92.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.92.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.93.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.93.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.94.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.94.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.95.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.95.up_proj.weight": 
"model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.96.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.96.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.97.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.97.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.98.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.98.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.99.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.99.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.100.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.100.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.101.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.101.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.102.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.102.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.103.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.103.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.104.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.104.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.105.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.105.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.106.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.106.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.107.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.107.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.108.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.108.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.109.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.109.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.110.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.110.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.111.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.111.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.112.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.112.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.113.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.113.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.114.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.114.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.115.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.115.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.116.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.116.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.117.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.117.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.118.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.118.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.119.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.119.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.120.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.120.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.121.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.121.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.122.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.122.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.123.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.123.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.124.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.124.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.125.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.125.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.126.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.126.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.127.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.127.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.128.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.128.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.129.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.129.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.130.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.130.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.131.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.131.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.132.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.132.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.133.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.133.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.134.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.134.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.135.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.135.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.136.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.136.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.137.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.137.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.138.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.138.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.139.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.139.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.140.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.140.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.141.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.141.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.142.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.142.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.143.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.143.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.144.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.144.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.145.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.145.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.146.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.146.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.147.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.147.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.148.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.148.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.149.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.149.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.150.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.150.up_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.151.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.151.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.152.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.152.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.153.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.153.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.154.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.154.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.155.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.155.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.156.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.156.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.157.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.157.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.158.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.158.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.159.gate_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.159.up_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.0.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.1.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.2.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.3.down_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.4.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.5.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.6.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.7.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.8.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.9.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.10.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.11.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.12.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.13.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.14.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.15.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.16.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.17.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.18.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.19.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.20.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.21.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.22.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.23.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.24.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.25.down_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.26.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.27.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.28.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.29.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.30.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.31.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.32.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.33.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.34.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.35.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.36.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.37.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.38.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.39.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.40.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.41.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.42.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.43.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.44.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.45.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.46.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.47.down_proj.weight": "model-00087-of-00132.safetensors", + 
"model.layers.62.mlp.experts.48.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.49.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.50.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.51.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.52.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.53.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.54.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.55.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.56.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.57.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.58.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.59.down_proj.weight": "model-00087-of-00132.safetensors", + "model.layers.62.mlp.experts.60.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.61.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.62.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.63.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.64.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.65.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.66.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.67.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.68.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.69.down_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.62.mlp.experts.70.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.71.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.72.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.73.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.74.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.75.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.76.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.77.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.78.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.79.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.80.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.81.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.82.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.83.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.84.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.85.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.86.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.87.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.88.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.89.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.90.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.91.down_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.62.mlp.experts.92.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.93.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.94.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.95.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.96.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.97.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.98.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.99.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.100.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.101.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.102.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.103.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.104.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.105.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.106.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.107.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.108.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.109.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.110.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.111.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.112.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.113.down_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.62.mlp.experts.114.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.115.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.116.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.117.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.118.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.119.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.120.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.121.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.122.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.123.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.124.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.125.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.126.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.127.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.128.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.129.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.130.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.131.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.132.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.133.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.134.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.135.down_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.62.mlp.experts.136.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.137.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.138.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.139.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.140.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.141.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.142.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.143.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.144.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.145.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.146.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.147.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.148.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.149.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.150.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.151.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.152.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.153.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.154.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.155.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.156.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.157.down_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.62.mlp.experts.158.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.experts.159.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.shared_experts.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.shared_experts.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.62.mlp.shared_experts.down_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.input_layernorm.weight": "model-00088-of-00132.safetensors", + "model.layers.63.self_attn.q_proj.bias": "model-00088-of-00132.safetensors", + "model.layers.63.self_attn.k_proj.bias": "model-00088-of-00132.safetensors", + "model.layers.63.self_attn.v_proj.bias": "model-00088-of-00132.safetensors", + "model.layers.63.self_attn.q_norm.weight": "model-00088-of-00132.safetensors", + "model.layers.63.self_attn.k_norm.weight": "model-00088-of-00132.safetensors", + "model.layers.63.post_attention_layernorm.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.gate.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.gate.e_score_correction_bias": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.0.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.1.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.2.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.3.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.3.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.4.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.5.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.6.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.7.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.8.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.8.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.9.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.9.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.10.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.10.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.11.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.11.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.12.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.12.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.13.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.13.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.14.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.14.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.15.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.15.up_proj.weight": 
"model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.16.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.16.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.17.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.17.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.18.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.18.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.19.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.19.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.20.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.20.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.21.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.21.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.22.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.22.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.23.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.23.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.24.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.24.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.25.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.25.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.26.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.26.up_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.27.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.27.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.28.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.28.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.29.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.29.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.30.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.30.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.31.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.31.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.32.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.32.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.33.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.33.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.34.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.34.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.35.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.35.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.36.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.36.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.37.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.37.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.38.gate_proj.weight": 
"model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.38.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.39.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.39.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.40.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.40.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.41.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.41.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.42.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.42.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.43.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.43.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.44.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.44.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.45.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.45.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.46.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.46.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.47.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.47.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.48.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.48.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.49.gate_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.49.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.50.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.50.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.51.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.51.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.52.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.52.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.53.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.53.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.54.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.54.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.55.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.55.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.56.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.56.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.57.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.57.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.58.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.58.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.59.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.59.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.60.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.60.up_proj.weight": 
"model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.61.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.61.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.62.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.62.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.63.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.63.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.64.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.64.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.65.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.65.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.66.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.66.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.67.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.67.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.68.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.68.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.69.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.69.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.70.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.70.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.71.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.71.up_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.72.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.72.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.73.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.73.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.74.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.74.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.75.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.75.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.76.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.76.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.77.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.77.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.78.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.78.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.79.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.79.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.80.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.80.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.81.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.81.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.82.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.82.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.83.gate_proj.weight": 
"model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.83.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.84.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.84.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.85.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.85.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.86.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.86.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.87.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.87.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.88.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.88.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.89.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.89.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.90.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.90.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.91.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.91.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.92.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.92.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.93.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.93.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.94.gate_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.94.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.95.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.95.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.96.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.96.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.97.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.97.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.98.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.98.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.99.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.99.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.100.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.100.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.101.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.101.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.102.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.102.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.103.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.103.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.104.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.104.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.105.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.105.up_proj.weight": 
"model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.106.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.106.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.107.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.107.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.108.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.108.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.109.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.109.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.110.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.110.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.111.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.111.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.112.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.112.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.113.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.113.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.114.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.114.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.115.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.115.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.116.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.116.up_proj.weight": "model-00088-of-00132.safetensors", + 
"model.layers.63.mlp.experts.117.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.117.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.118.gate_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.118.up_proj.weight": "model-00088-of-00132.safetensors", + "model.layers.63.mlp.experts.119.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.119.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.120.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.120.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.121.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.121.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.122.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.122.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.123.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.123.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.124.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.124.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.125.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.125.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.126.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.126.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.127.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.127.up_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.128.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.128.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.129.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.129.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.130.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.130.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.131.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.131.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.132.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.132.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.133.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.133.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.134.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.134.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.135.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.135.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.136.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.136.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.137.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.137.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.138.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.138.up_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.139.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.139.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.140.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.140.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.141.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.141.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.142.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.142.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.143.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.143.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.144.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.144.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.145.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.145.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.146.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.146.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.147.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.147.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.148.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.148.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.149.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.149.up_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.150.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.150.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.151.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.151.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.152.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.152.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.153.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.153.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.154.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.154.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.155.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.155.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.156.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.156.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.157.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.157.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.158.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.158.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.159.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.159.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.0.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.1.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.2.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.3.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.4.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.5.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.6.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.7.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.8.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.9.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.10.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.11.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.12.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.13.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.14.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.15.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.16.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.17.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.18.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.19.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.20.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.21.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.22.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.23.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.24.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.25.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.26.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.27.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.28.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.29.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.30.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.31.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.32.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.33.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.34.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.35.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.36.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.37.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.38.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.39.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.40.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.41.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.42.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.43.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.44.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.45.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.46.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.47.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.48.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.49.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.50.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.51.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.52.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.53.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.54.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.55.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.56.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.57.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.58.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.59.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.60.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.61.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.62.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.63.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.64.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.65.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.66.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.67.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.68.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.69.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.70.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.71.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.72.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.73.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.74.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.75.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.76.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.77.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.78.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.79.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.80.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.81.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.82.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.83.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.84.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.85.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.86.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.87.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.88.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.89.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.90.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.91.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.92.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.93.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.94.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.95.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.96.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.97.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.98.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.99.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.100.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.101.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.102.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.103.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.104.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.105.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.106.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.107.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.108.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.109.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.110.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.111.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.112.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.113.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.114.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.115.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.116.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.117.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.118.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.119.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.120.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.121.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.122.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.123.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.124.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.125.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.126.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.127.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.128.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.129.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.130.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.131.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.132.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.133.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.134.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.135.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.136.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.137.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.138.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.139.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.140.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.141.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.142.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.143.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.144.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.145.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.146.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.147.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.148.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.149.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.150.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.151.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.152.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.153.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.154.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.155.down_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.63.mlp.experts.156.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.157.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.158.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.experts.159.down_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.shared_experts.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.63.mlp.shared_experts.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.o_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.input_layernorm.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.q_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.k_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.v_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.q_proj.bias": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.k_proj.bias": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.v_proj.bias": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.q_norm.weight": "model-00089-of-00132.safetensors", + "model.layers.64.self_attn.k_norm.weight": "model-00089-of-00132.safetensors", + "model.layers.64.post_attention_layernorm.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.gate.e_score_correction_bias": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.0.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.0.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.1.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.1.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.2.gate_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.64.mlp.experts.2.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.3.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.3.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.4.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.4.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.5.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.5.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.6.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.6.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.7.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.7.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.8.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.8.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.9.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.9.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.10.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.10.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.11.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.11.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.12.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.12.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.13.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.13.up_proj.weight": 
"model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.14.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.14.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.15.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.15.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.16.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.16.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.17.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.17.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.18.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.18.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.19.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.19.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.20.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.20.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.21.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.21.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.22.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.22.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.23.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.23.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.24.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.24.up_proj.weight": "model-00089-of-00132.safetensors", + 
"model.layers.64.mlp.experts.25.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.25.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.26.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.26.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.27.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.27.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.28.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.28.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.29.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.29.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.30.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.30.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.31.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.31.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.32.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.32.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.33.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.33.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.34.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.34.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.35.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.35.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.36.gate_proj.weight": 
"model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.36.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.37.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.37.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.38.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.38.up_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.39.gate_proj.weight": "model-00089-of-00132.safetensors", + "model.layers.64.mlp.experts.39.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.40.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.40.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.41.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.41.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.42.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.42.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.43.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.43.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.44.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.44.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.45.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.45.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.46.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.46.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.47.gate_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.47.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.48.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.48.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.49.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.49.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.50.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.50.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.51.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.51.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.52.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.52.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.53.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.53.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.54.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.54.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.55.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.55.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.56.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.56.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.57.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.57.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.58.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.58.up_proj.weight": 
"model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.59.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.59.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.60.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.60.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.61.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.61.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.62.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.62.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.63.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.63.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.64.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.64.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.65.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.65.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.66.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.66.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.67.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.67.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.68.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.68.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.69.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.69.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.70.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.70.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.71.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.71.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.72.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.72.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.73.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.73.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.74.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.74.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.75.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.75.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.76.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.76.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.77.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.77.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.78.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.78.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.79.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.79.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.80.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.80.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.81.gate_proj.weight": 
"model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.81.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.82.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.82.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.83.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.83.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.84.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.84.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.85.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.85.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.86.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.86.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.87.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.87.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.88.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.88.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.89.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.89.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.90.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.90.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.91.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.91.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.92.gate_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.92.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.93.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.93.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.94.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.94.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.95.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.95.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.96.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.96.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.97.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.97.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.98.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.98.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.99.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.99.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.100.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.100.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.101.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.101.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.102.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.102.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.103.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.103.up_proj.weight": 
"model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.104.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.104.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.105.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.105.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.106.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.106.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.107.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.107.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.108.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.108.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.109.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.109.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.110.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.110.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.111.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.111.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.112.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.112.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.113.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.113.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.114.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.114.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.115.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.115.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.116.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.116.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.117.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.117.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.118.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.118.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.119.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.119.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.120.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.120.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.121.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.121.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.122.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.122.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.123.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.123.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.124.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.124.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.125.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.125.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.126.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.126.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.127.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.127.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.128.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.128.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.129.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.129.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.130.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.130.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.131.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.131.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.132.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.132.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.133.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.133.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.134.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.134.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.135.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.135.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.136.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.136.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.137.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.137.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.138.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.138.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.139.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.139.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.140.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.140.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.141.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.141.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.142.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.142.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.143.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.143.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.144.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.144.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.145.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.145.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.146.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.146.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.147.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.147.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.148.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.148.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.149.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.149.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.150.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.150.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.151.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.151.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.152.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.152.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.153.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.153.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.154.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.154.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.155.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.155.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.156.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.156.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.157.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.157.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.158.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.158.up_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.159.gate_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.159.up_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.0.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.1.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.2.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.3.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.4.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.5.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.6.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.7.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.8.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.9.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.10.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.11.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.12.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.13.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.14.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.15.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.16.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.17.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.18.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.19.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.20.down_proj.weight": 
"model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.21.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.22.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.23.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.24.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.25.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.26.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.27.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.28.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.29.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.30.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.31.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.32.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.33.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.34.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.35.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.36.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.37.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.38.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.39.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.40.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.41.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.42.down_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.43.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.44.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.45.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.46.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.47.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.48.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.49.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.50.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.51.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.52.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.53.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.54.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.55.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.56.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.57.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.58.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.59.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.60.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.61.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.62.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.63.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.64.down_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.65.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.66.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.67.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.68.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.69.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.70.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.71.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.72.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.73.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.74.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.75.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.76.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.77.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.78.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.79.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.80.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.81.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.82.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.83.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.84.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.85.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.86.down_proj.weight": "model-00090-of-00132.safetensors", + 
"model.layers.64.mlp.experts.87.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.88.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.89.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.90.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.91.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.92.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.93.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.94.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.95.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.96.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.97.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.98.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.99.down_proj.weight": "model-00090-of-00132.safetensors", + "model.layers.64.mlp.experts.100.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.101.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.102.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.103.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.104.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.105.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.106.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.107.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.108.down_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.64.mlp.experts.109.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.110.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.111.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.112.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.113.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.114.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.115.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.116.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.117.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.118.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.119.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.120.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.121.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.122.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.123.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.124.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.125.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.126.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.127.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.128.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.129.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.130.down_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.64.mlp.experts.131.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.132.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.133.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.134.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.135.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.136.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.137.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.138.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.139.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.140.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.141.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.142.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.143.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.144.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.145.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.146.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.147.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.148.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.149.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.150.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.151.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.152.down_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.64.mlp.experts.153.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.154.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.155.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.156.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.157.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.158.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.experts.159.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.shared_experts.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.shared_experts.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.64.mlp.shared_experts.down_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.input_layernorm.weight": "model-00091-of-00132.safetensors", + "model.layers.65.self_attn.q_proj.bias": "model-00091-of-00132.safetensors", + "model.layers.65.self_attn.k_proj.bias": "model-00091-of-00132.safetensors", + "model.layers.65.self_attn.v_proj.bias": "model-00091-of-00132.safetensors", + "model.layers.65.self_attn.q_norm.weight": "model-00091-of-00132.safetensors", + "model.layers.65.self_attn.k_norm.weight": "model-00091-of-00132.safetensors", + "model.layers.65.post_attention_layernorm.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.gate.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.gate.e_score_correction_bias": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.0.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.0.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.1.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.1.up_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.2.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.2.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.3.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.3.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.4.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.4.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.5.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.5.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.6.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.6.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.7.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.7.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.8.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.8.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.9.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.9.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.10.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.10.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.11.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.11.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.12.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.12.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.13.gate_proj.weight": 
"model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.13.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.14.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.14.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.15.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.15.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.16.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.16.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.17.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.17.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.18.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.18.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.19.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.19.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.20.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.20.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.21.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.21.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.22.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.22.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.23.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.23.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.24.gate_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.24.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.25.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.25.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.26.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.26.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.27.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.27.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.28.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.28.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.29.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.29.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.30.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.30.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.31.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.31.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.32.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.32.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.33.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.33.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.34.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.34.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.35.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.35.up_proj.weight": 
"model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.36.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.36.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.37.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.37.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.38.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.38.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.39.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.39.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.40.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.40.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.41.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.41.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.42.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.42.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.43.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.43.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.44.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.44.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.45.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.45.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.46.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.46.up_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.47.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.47.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.48.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.48.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.49.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.49.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.50.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.50.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.51.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.51.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.52.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.52.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.53.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.53.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.54.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.54.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.55.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.55.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.56.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.56.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.57.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.57.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.58.gate_proj.weight": 
"model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.58.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.59.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.59.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.60.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.60.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.61.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.61.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.62.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.62.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.63.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.63.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.64.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.64.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.65.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.65.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.66.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.66.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.67.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.67.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.68.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.68.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.69.gate_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.69.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.70.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.70.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.71.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.71.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.72.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.72.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.73.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.73.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.74.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.74.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.75.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.75.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.76.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.76.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.77.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.77.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.78.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.78.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.79.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.79.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.80.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.80.up_proj.weight": 
"model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.81.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.81.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.82.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.82.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.83.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.83.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.84.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.84.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.85.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.85.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.86.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.86.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.87.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.87.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.88.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.88.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.89.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.89.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.90.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.90.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.91.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.91.up_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.92.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.92.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.93.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.93.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.94.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.94.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.95.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.95.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.96.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.96.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.97.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.97.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.98.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.98.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.99.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.99.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.100.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.100.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.101.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.101.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.102.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.102.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.103.gate_proj.weight": 
"model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.103.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.104.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.104.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.105.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.105.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.106.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.106.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.107.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.107.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.108.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.108.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.109.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.109.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.110.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.110.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.111.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.111.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.112.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.112.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.113.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.113.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.114.gate_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.114.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.115.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.115.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.116.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.116.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.117.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.117.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.118.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.118.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.119.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.119.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.120.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.120.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.121.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.121.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.122.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.122.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.123.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.123.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.124.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.124.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.125.gate_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.125.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.126.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.126.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.127.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.127.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.128.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.128.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.129.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.129.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.130.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.130.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.131.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.131.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.132.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.132.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.133.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.133.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.134.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.134.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.135.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.135.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.136.gate_proj.weight": "model-00091-of-00132.safetensors", + 
"model.layers.65.mlp.experts.136.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.137.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.137.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.138.gate_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.138.up_proj.weight": "model-00091-of-00132.safetensors", + "model.layers.65.mlp.experts.139.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.139.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.140.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.140.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.141.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.141.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.142.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.142.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.143.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.143.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.144.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.144.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.145.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.145.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.146.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.146.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.147.gate_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.147.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.148.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.148.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.149.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.149.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.150.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.150.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.151.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.151.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.152.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.152.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.153.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.153.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.154.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.154.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.155.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.155.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.156.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.156.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.157.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.157.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.158.gate_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.158.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.159.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.159.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.0.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.1.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.2.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.3.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.4.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.5.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.6.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.7.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.8.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.9.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.10.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.11.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.12.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.13.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.14.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.15.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.16.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.17.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.18.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.19.down_proj.weight": 
"model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.20.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.21.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.22.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.23.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.24.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.25.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.26.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.27.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.28.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.29.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.30.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.31.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.32.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.33.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.34.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.35.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.36.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.37.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.38.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.39.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.40.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.41.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.42.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.43.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.44.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.45.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.46.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.47.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.48.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.49.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.50.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.51.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.52.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.53.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.54.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.55.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.56.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.57.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.58.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.59.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.60.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.61.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.62.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.63.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.64.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.65.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.66.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.67.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.68.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.69.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.70.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.71.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.72.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.73.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.74.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.75.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.76.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.77.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.78.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.79.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.80.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.81.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.82.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.83.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.84.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.85.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.86.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.87.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.88.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.89.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.90.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.91.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.92.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.93.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.94.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.95.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.96.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.97.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.98.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.99.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.100.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.101.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.102.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.103.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.104.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.105.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.106.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.107.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.108.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.109.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.110.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.111.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.112.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.113.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.114.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.115.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.116.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.117.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.118.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.119.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.120.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.121.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.122.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.123.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.124.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.125.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.126.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.127.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.128.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.129.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.130.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.131.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.132.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.133.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.134.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.135.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.136.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.137.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.138.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.139.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.140.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.141.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.142.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.143.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.144.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.145.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.146.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.147.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.148.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.149.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.150.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.151.down_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.65.mlp.experts.152.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.153.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.154.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.155.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.156.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.157.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.158.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.experts.159.down_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.shared_experts.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.65.mlp.shared_experts.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.o_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.input_layernorm.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.q_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.k_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.v_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.q_proj.bias": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.k_proj.bias": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.v_proj.bias": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.q_norm.weight": "model-00092-of-00132.safetensors", + "model.layers.66.self_attn.k_norm.weight": "model-00092-of-00132.safetensors", + "model.layers.66.post_attention_layernorm.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.gate.e_score_correction_bias": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.0.gate_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.66.mlp.experts.0.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.1.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.1.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.2.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.2.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.3.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.3.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.4.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.4.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.5.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.5.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.6.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.6.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.7.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.7.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.8.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.8.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.9.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.9.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.10.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.10.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.11.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.11.up_proj.weight": 
"model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.12.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.12.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.13.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.13.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.14.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.14.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.15.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.15.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.16.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.16.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.17.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.17.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.18.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.18.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.19.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.19.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.20.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.20.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.21.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.21.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.22.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.22.up_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.66.mlp.experts.23.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.23.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.24.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.24.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.25.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.25.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.26.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.26.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.27.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.27.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.28.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.28.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.29.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.29.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.30.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.30.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.31.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.31.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.32.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.32.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.33.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.33.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.34.gate_proj.weight": 
"model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.34.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.35.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.35.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.36.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.36.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.37.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.37.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.38.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.38.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.39.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.39.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.40.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.40.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.41.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.41.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.42.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.42.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.43.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.43.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.44.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.44.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.45.gate_proj.weight": "model-00092-of-00132.safetensors", + 
"model.layers.66.mlp.experts.45.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.46.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.46.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.47.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.47.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.48.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.48.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.49.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.49.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.50.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.50.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.51.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.51.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.52.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.52.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.53.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.53.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.54.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.54.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.55.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.55.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.56.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.56.up_proj.weight": 
"model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.57.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.57.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.58.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.58.up_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.59.gate_proj.weight": "model-00092-of-00132.safetensors", + "model.layers.66.mlp.experts.59.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.60.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.60.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.61.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.61.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.62.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.62.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.63.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.63.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.64.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.64.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.65.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.65.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.66.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.66.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.67.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.67.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.68.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.68.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.69.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.69.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.70.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.70.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.71.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.71.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.72.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.72.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.73.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.73.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.74.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.74.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.75.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.75.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.76.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.76.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.77.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.77.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.78.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.78.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.79.gate_proj.weight": 
"model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.79.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.80.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.80.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.81.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.81.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.82.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.82.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.83.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.83.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.84.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.84.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.85.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.85.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.86.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.86.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.87.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.87.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.88.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.88.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.89.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.89.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.90.gate_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.90.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.91.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.91.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.92.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.92.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.93.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.93.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.94.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.94.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.95.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.95.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.96.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.96.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.97.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.97.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.98.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.98.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.99.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.99.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.100.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.100.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.101.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.101.up_proj.weight": 
"model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.102.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.102.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.103.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.103.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.104.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.104.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.105.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.105.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.106.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.106.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.107.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.107.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.108.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.108.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.109.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.109.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.110.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.110.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.111.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.111.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.112.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.112.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.113.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.113.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.114.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.114.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.115.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.115.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.116.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.116.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.117.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.117.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.118.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.118.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.119.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.119.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.120.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.120.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.121.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.121.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.122.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.122.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.123.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.123.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.124.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.124.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.125.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.125.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.126.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.126.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.127.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.127.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.128.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.128.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.129.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.129.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.130.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.130.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.131.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.131.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.132.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.132.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.133.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.133.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.134.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.134.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.135.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.135.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.136.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.136.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.137.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.137.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.138.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.138.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.139.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.139.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.140.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.140.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.141.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.141.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.142.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.142.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.143.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.143.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.144.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.144.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.145.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.145.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.146.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.146.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.147.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.147.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.148.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.148.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.149.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.149.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.150.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.150.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.151.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.151.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.152.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.152.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.153.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.153.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.154.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.154.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.155.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.155.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.156.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.156.up_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.157.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.157.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.158.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.158.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.159.gate_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.159.up_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.0.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.1.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.2.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.3.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.4.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.5.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.6.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.7.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.8.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.9.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.10.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.11.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.12.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.13.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.14.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.15.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.16.down_proj.weight": 
"model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.17.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.18.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.19.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.20.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.21.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.22.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.23.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.24.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.25.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.26.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.27.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.28.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.29.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.30.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.31.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.32.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.33.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.34.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.35.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.36.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.37.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.38.down_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.39.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.40.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.41.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.42.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.43.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.44.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.45.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.46.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.47.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.48.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.49.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.50.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.51.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.52.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.53.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.54.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.55.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.56.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.57.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.58.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.59.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.60.down_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.61.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.62.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.63.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.64.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.65.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.66.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.67.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.68.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.69.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.70.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.71.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.72.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.73.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.74.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.75.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.76.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.77.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.78.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.79.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.80.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.81.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.82.down_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.83.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.84.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.85.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.86.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.87.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.88.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.89.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.90.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.91.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.92.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.93.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.94.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.95.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.96.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.97.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.98.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.99.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.100.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.101.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.102.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.103.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.104.down_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.105.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.106.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.107.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.108.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.109.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.110.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.111.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.112.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.113.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.114.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.115.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.116.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.117.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.118.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.119.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.120.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.121.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.122.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.123.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.124.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.125.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.126.down_proj.weight": "model-00093-of-00132.safetensors", + 
"model.layers.66.mlp.experts.127.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.128.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.129.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.130.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.131.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.132.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.133.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.134.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.135.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.136.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.137.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.138.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.139.down_proj.weight": "model-00093-of-00132.safetensors", + "model.layers.66.mlp.experts.140.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.141.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.142.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.143.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.144.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.145.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.146.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.147.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.148.down_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.66.mlp.experts.149.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.150.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.151.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.152.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.153.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.154.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.155.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.156.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.157.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.158.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.experts.159.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.shared_experts.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.shared_experts.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.66.mlp.shared_experts.down_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.input_layernorm.weight": "model-00094-of-00132.safetensors", + "model.layers.67.self_attn.q_proj.bias": "model-00094-of-00132.safetensors", + "model.layers.67.self_attn.k_proj.bias": "model-00094-of-00132.safetensors", + "model.layers.67.self_attn.v_proj.bias": "model-00094-of-00132.safetensors", + "model.layers.67.self_attn.q_norm.weight": "model-00094-of-00132.safetensors", + "model.layers.67.self_attn.k_norm.weight": "model-00094-of-00132.safetensors", + "model.layers.67.post_attention_layernorm.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.gate.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.gate.e_score_correction_bias": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.0.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.0.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.1.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.1.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.2.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.2.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.3.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.3.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.4.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.4.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.5.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.5.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.6.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.6.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.7.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.7.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.8.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.8.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.9.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.9.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.10.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.10.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.11.gate_proj.weight": 
"model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.11.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.12.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.12.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.13.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.13.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.14.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.14.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.15.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.15.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.16.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.16.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.17.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.17.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.18.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.18.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.19.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.19.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.20.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.20.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.21.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.21.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.22.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.22.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.23.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.23.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.24.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.24.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.25.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.25.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.26.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.26.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.27.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.27.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.28.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.28.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.29.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.29.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.30.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.30.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.31.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.31.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.32.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.32.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.33.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.33.up_proj.weight": 
"model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.34.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.34.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.35.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.35.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.36.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.36.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.37.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.37.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.38.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.38.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.39.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.39.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.40.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.40.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.41.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.41.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.42.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.42.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.43.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.43.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.44.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.44.up_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.45.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.45.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.46.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.46.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.47.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.47.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.48.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.48.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.49.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.49.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.50.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.50.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.51.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.51.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.52.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.52.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.53.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.53.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.54.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.54.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.55.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.55.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.56.gate_proj.weight": 
"model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.56.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.57.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.57.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.58.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.58.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.59.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.59.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.60.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.60.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.61.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.61.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.62.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.62.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.63.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.63.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.64.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.64.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.65.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.65.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.66.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.66.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.67.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.67.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.68.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.68.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.69.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.69.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.70.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.70.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.71.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.71.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.72.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.72.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.73.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.73.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.74.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.74.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.75.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.75.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.76.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.76.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.77.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.77.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.78.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.78.up_proj.weight": 
"model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.79.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.79.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.80.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.80.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.81.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.81.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.82.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.82.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.83.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.83.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.84.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.84.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.85.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.85.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.86.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.86.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.87.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.87.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.88.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.88.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.89.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.89.up_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.90.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.90.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.91.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.91.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.92.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.92.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.93.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.93.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.94.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.94.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.95.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.95.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.96.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.96.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.97.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.97.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.98.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.98.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.99.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.99.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.100.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.100.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.101.gate_proj.weight": 
"model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.101.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.102.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.102.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.103.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.103.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.104.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.104.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.105.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.105.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.106.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.106.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.107.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.107.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.108.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.108.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.109.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.109.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.110.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.110.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.111.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.111.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.112.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.112.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.113.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.113.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.114.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.114.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.115.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.115.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.116.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.116.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.117.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.117.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.118.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.118.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.119.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.119.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.120.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.120.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.121.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.121.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.122.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.122.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.123.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.123.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.124.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.124.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.125.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.125.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.126.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.126.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.127.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.127.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.128.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.128.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.129.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.129.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.130.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.130.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.131.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.131.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.132.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.132.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.133.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.133.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.134.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.134.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.135.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.135.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.136.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.136.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.137.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.137.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.138.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.138.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.139.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.139.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.140.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.140.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.141.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.141.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.142.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.142.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.143.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.143.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.144.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.144.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.145.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.145.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.146.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.146.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.147.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.147.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.148.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.148.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.149.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.149.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.150.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.150.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.151.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.151.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.152.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.152.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.153.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.153.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.154.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.154.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.155.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.155.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.156.gate_proj.weight": "model-00094-of-00132.safetensors", + 
"model.layers.67.mlp.experts.156.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.157.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.157.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.158.gate_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.158.up_proj.weight": "model-00094-of-00132.safetensors", + "model.layers.67.mlp.experts.159.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.159.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.0.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.1.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.2.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.3.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.4.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.5.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.6.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.7.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.8.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.9.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.10.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.11.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.12.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.13.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.14.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.15.down_proj.weight": 
"model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.16.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.17.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.18.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.19.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.20.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.21.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.22.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.23.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.24.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.25.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.26.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.27.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.28.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.29.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.30.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.31.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.32.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.33.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.34.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.35.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.36.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.37.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.38.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.39.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.40.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.41.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.42.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.43.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.44.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.45.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.46.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.47.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.48.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.49.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.50.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.51.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.52.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.53.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.54.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.55.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.56.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.57.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.58.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.59.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.60.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.61.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.62.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.63.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.64.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.65.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.66.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.67.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.68.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.69.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.70.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.71.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.72.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.73.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.74.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.75.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.76.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.77.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.78.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.79.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.80.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.81.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.82.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.83.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.84.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.85.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.86.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.87.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.88.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.89.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.90.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.91.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.92.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.93.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.94.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.95.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.96.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.97.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.98.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.99.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.100.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.101.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.102.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.103.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.104.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.105.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.106.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.107.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.108.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.109.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.110.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.111.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.112.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.113.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.114.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.115.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.116.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.117.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.118.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.119.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.120.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.121.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.122.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.123.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.124.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.125.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.126.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.127.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.128.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.129.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.130.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.131.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.132.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.133.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.134.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.135.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.136.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.137.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.138.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.139.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.140.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.141.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.142.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.143.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.144.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.145.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.146.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.147.down_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.67.mlp.experts.148.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.149.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.150.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.151.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.152.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.153.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.154.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.155.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.156.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.157.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.158.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.experts.159.down_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.shared_experts.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.67.mlp.shared_experts.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.o_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.input_layernorm.weight": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.q_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.k_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.v_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.q_proj.bias": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.k_proj.bias": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.v_proj.bias": "model-00095-of-00132.safetensors", + "model.layers.68.self_attn.q_norm.weight": "model-00095-of-00132.safetensors", + 
"model.layers.68.self_attn.k_norm.weight": "model-00095-of-00132.safetensors", + "model.layers.68.post_attention_layernorm.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.gate.e_score_correction_bias": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.0.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.0.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.1.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.1.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.2.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.2.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.3.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.3.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.4.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.4.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.5.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.5.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.6.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.6.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.7.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.7.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.8.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.8.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.9.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.9.up_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.68.mlp.experts.10.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.10.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.11.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.11.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.12.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.12.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.13.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.13.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.14.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.14.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.15.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.15.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.16.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.16.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.17.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.17.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.18.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.18.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.19.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.19.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.20.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.20.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.21.gate_proj.weight": 
"model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.21.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.22.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.22.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.23.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.23.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.24.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.24.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.25.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.25.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.26.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.26.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.27.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.27.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.28.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.28.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.29.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.29.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.30.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.30.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.31.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.31.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.32.gate_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.68.mlp.experts.32.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.33.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.33.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.34.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.34.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.35.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.35.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.36.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.36.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.37.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.37.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.38.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.38.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.39.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.39.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.40.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.40.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.41.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.41.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.42.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.42.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.43.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.43.up_proj.weight": 
"model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.44.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.44.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.45.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.45.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.46.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.46.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.47.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.47.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.48.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.48.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.49.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.49.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.50.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.50.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.51.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.51.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.52.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.52.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.53.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.53.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.54.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.54.up_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.68.mlp.experts.55.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.55.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.56.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.56.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.57.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.57.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.58.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.58.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.59.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.59.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.60.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.60.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.61.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.61.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.62.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.62.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.63.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.63.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.64.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.64.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.65.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.65.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.66.gate_proj.weight": 
"model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.66.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.67.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.67.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.68.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.68.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.69.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.69.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.70.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.70.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.71.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.71.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.72.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.72.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.73.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.73.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.74.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.74.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.75.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.75.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.76.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.76.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.77.gate_proj.weight": "model-00095-of-00132.safetensors", + 
"model.layers.68.mlp.experts.77.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.78.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.78.up_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.79.gate_proj.weight": "model-00095-of-00132.safetensors", + "model.layers.68.mlp.experts.79.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.80.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.80.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.81.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.81.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.82.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.82.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.83.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.83.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.84.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.84.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.85.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.85.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.86.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.86.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.87.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.87.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.88.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.88.up_proj.weight": 
"model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.89.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.89.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.90.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.90.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.91.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.91.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.92.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.92.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.93.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.93.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.94.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.94.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.95.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.95.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.96.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.96.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.97.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.97.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.98.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.98.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.99.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.99.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.100.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.100.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.101.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.101.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.102.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.102.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.103.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.103.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.104.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.104.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.105.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.105.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.106.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.106.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.107.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.107.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.108.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.108.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.109.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.109.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.110.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.110.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.111.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.111.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.112.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.112.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.113.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.113.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.114.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.114.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.115.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.115.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.116.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.116.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.117.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.117.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.118.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.118.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.119.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.119.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.120.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.120.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.121.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.121.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.122.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.122.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.123.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.123.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.124.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.124.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.125.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.125.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.126.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.126.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.127.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.127.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.128.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.128.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.129.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.129.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.130.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.130.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.131.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.131.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.132.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.132.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.133.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.133.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.134.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.134.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.135.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.135.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.136.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.136.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.137.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.137.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.138.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.138.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.139.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.139.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.140.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.140.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.141.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.141.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.142.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.142.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.143.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.143.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.144.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.144.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.145.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.145.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.146.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.146.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.147.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.147.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.148.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.148.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.149.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.149.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.150.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.150.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.151.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.151.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.152.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.152.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.153.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.153.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.154.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.154.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.155.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.155.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.156.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.156.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.157.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.157.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.158.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.158.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.159.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.159.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.0.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.1.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.2.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.3.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.4.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.5.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.6.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.7.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.8.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.9.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.10.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.11.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.12.down_proj.weight": 
"model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.13.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.14.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.15.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.16.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.17.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.18.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.19.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.20.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.21.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.22.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.23.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.24.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.25.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.26.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.27.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.28.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.29.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.30.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.31.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.32.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.33.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.34.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.35.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.36.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.37.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.38.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.39.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.40.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.41.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.42.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.43.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.44.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.45.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.46.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.47.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.48.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.49.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.50.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.51.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.52.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.53.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.54.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.55.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.56.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.57.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.58.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.59.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.60.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.61.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.62.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.63.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.64.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.65.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.66.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.67.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.68.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.69.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.70.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.71.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.72.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.73.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.74.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.75.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.76.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.77.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.78.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.79.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.80.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.81.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.82.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.83.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.84.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.85.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.86.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.87.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.88.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.89.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.90.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.91.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.92.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.93.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.94.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.95.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.96.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.97.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.98.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.99.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.100.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.101.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.102.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.103.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.104.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.105.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.106.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.107.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.108.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.109.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.110.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.111.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.112.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.113.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.114.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.115.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.116.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.117.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.118.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.119.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.120.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.121.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.122.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.123.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.124.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.125.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.126.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.127.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.128.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.129.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.130.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.131.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.132.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.133.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.134.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.135.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.136.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.137.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.138.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.139.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.140.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.141.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.142.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.143.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.144.down_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.68.mlp.experts.145.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.146.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.147.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.148.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.149.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.150.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.151.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.152.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.153.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.154.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.155.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.156.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.157.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.158.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.experts.159.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.shared_experts.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.shared_experts.up_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.68.mlp.shared_experts.down_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.46.mlp.gate.weight": "model-00096-of-00132.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00096-of-00132.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00096-of-00132.safetensors", + 
"model.layers.47.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.47.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.47.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.47.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.48.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.49.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.49.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.49.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.50.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.51.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.51.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.51.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.52.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.53.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.53.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.53.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.54.mlp.gate.weight": "model-00097-of-00132.safetensors", + 
"model.layers.55.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.55.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.55.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.55.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.56.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.57.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.57.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.57.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.58.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.59.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.59.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.59.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.60.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.61.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.61.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.61.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.62.mlp.gate.weight": "model-00097-of-00132.safetensors", + 
"model.layers.63.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.63.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.63.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.63.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.63.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.64.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.65.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.65.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.65.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.65.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.65.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.66.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.67.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.67.self_attn.q_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.67.self_attn.k_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.67.self_attn.v_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.67.mlp.shared_experts.down_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.68.mlp.gate.weight": "model-00097-of-00132.safetensors", + "model.layers.69.self_attn.o_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.self_attn.q_norm.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.gate.e_score_correction_bias": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.0.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.0.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.1.gate_proj.weight": "model-00097-of-00132.safetensors", + 
"model.layers.69.mlp.experts.1.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.2.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.2.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.3.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.3.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.4.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.4.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.5.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.5.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.6.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.6.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.7.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.7.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.8.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.8.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.9.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.9.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.10.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.10.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.11.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.11.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.12.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.12.up_proj.weight": 
"model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.13.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.13.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.14.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.14.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.15.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.15.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.16.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.16.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.17.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.17.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.18.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.18.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.19.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.19.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.20.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.20.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.21.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.21.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.22.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.22.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.23.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.23.up_proj.weight": "model-00097-of-00132.safetensors", + 
"model.layers.69.mlp.experts.24.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.24.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.25.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.25.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.26.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.26.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.27.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.27.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.28.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.28.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.29.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.29.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.30.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.30.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.31.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.31.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.32.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.32.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.33.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.33.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.34.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.34.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.35.gate_proj.weight": 
"model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.35.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.36.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.36.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.37.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.37.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.38.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.38.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.39.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.39.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.40.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.40.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.41.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.41.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.42.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.42.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.43.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.43.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.44.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.44.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.45.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.45.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.46.gate_proj.weight": "model-00097-of-00132.safetensors", + 
"model.layers.69.mlp.experts.46.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.47.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.47.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.48.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.48.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.49.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.49.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.50.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.50.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.51.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.51.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.52.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.52.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.53.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.53.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.54.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.54.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.55.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.55.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.56.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.56.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.57.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.57.up_proj.weight": 
"model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.58.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.58.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.59.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.59.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.60.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.60.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.61.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.61.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.62.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.62.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.63.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.63.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.64.gate_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.64.up_proj.weight": "model-00097-of-00132.safetensors", + "model.layers.69.mlp.experts.65.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.65.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.66.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.66.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.67.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.67.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.68.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.68.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.69.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.69.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.70.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.70.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.71.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.71.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.72.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.72.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.73.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.73.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.74.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.74.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.75.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.75.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.76.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.76.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.77.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.77.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.78.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.78.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.79.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.79.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.80.gate_proj.weight": 
"model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.80.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.81.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.81.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.82.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.82.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.83.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.83.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.84.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.84.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.85.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.85.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.86.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.86.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.87.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.87.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.88.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.88.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.89.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.89.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.90.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.90.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.91.gate_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.91.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.92.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.92.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.93.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.93.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.94.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.94.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.95.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.95.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.96.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.96.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.97.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.97.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.98.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.98.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.99.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.99.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.100.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.100.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.101.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.101.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.102.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.102.up_proj.weight": 
"model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.103.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.103.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.104.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.104.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.105.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.105.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.106.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.106.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.107.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.107.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.108.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.108.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.109.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.109.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.110.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.110.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.111.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.111.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.112.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.112.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.113.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.113.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.114.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.114.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.115.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.115.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.116.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.116.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.117.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.117.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.118.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.118.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.119.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.119.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.120.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.120.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.121.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.121.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.122.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.122.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.123.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.123.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.124.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.124.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.125.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.125.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.126.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.126.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.127.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.127.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.128.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.128.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.129.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.129.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.130.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.130.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.131.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.131.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.132.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.132.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.133.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.133.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.134.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.134.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.135.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.135.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.136.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.136.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.137.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.137.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.138.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.138.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.139.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.139.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.140.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.140.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.141.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.141.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.142.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.142.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.143.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.143.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.144.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.144.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.145.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.145.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.146.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.146.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.147.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.147.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.148.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.148.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.149.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.149.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.150.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.150.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.151.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.151.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.152.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.152.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.153.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.153.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.154.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.154.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.155.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.155.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.156.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.156.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.157.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.157.up_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.158.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.158.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.159.gate_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.159.up_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.0.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.1.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.2.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.3.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.4.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.5.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.6.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.7.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.8.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.9.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.10.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.11.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.12.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.13.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.14.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.15.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.16.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.17.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.18.down_proj.weight": 
"model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.19.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.20.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.21.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.22.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.23.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.24.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.25.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.26.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.27.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.28.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.29.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.30.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.31.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.32.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.33.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.34.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.35.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.36.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.37.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.38.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.39.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.40.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.41.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.42.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.43.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.44.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.45.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.46.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.47.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.48.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.49.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.50.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.51.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.52.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.53.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.54.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.55.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.56.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.57.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.58.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.59.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.60.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.61.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.62.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.63.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.64.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.65.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.66.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.67.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.68.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.69.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.70.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.71.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.72.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.73.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.74.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.75.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.76.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.77.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.78.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.79.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.80.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.81.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.82.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.83.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.84.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.85.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.86.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.87.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.88.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.89.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.90.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.91.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.92.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.93.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.94.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.95.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.96.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.97.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.98.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.99.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.100.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.101.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.102.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.103.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.104.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.105.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.106.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.107.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.108.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.109.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.110.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.111.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.112.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.113.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.114.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.115.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.116.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.117.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.118.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.119.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.120.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.121.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.122.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.123.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.124.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.125.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.126.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.127.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.128.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.129.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.130.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.131.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.132.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.133.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.134.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.135.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.136.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.137.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.138.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.139.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.140.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.141.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.142.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.143.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.144.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.145.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.146.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.147.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.148.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.149.down_proj.weight": "model-00098-of-00132.safetensors", + "model.layers.69.mlp.experts.150.down_proj.weight": "model-00098-of-00132.safetensors", + 
"model.layers.69.mlp.experts.151.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.152.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.153.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.154.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.155.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.156.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.157.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.158.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.69.mlp.experts.159.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.self_attn.q_norm.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.0.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.0.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.1.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.1.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.2.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.2.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.3.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.3.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.4.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.4.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.5.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.5.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.6.gate_proj.weight": 
"model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.6.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.7.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.7.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.8.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.8.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.9.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.9.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.10.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.10.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.11.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.11.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.12.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.12.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.13.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.13.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.14.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.14.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.15.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.15.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.16.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.16.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.17.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.17.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.18.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.18.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.19.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.19.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.20.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.20.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.21.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.21.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.22.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.22.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.23.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.23.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.24.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.24.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.25.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.25.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.26.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.26.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.27.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.27.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.28.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.28.up_proj.weight": 
"model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.29.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.29.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.30.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.30.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.31.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.31.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.32.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.32.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.33.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.33.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.34.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.34.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.35.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.35.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.36.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.36.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.37.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.37.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.38.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.38.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.39.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.39.up_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.40.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.40.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.41.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.41.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.42.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.42.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.43.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.43.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.44.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.44.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.45.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.45.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.46.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.46.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.47.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.47.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.48.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.48.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.49.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.49.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.50.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.50.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.51.gate_proj.weight": 
"model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.51.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.52.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.52.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.53.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.53.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.54.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.54.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.55.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.55.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.56.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.56.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.57.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.57.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.58.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.58.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.59.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.59.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.60.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.60.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.61.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.61.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.62.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.62.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.63.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.63.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.64.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.64.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.65.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.65.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.66.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.66.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.67.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.67.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.68.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.68.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.69.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.69.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.70.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.70.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.71.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.71.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.72.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.72.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.73.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.73.up_proj.weight": 
"model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.74.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.74.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.75.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.75.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.76.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.76.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.77.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.77.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.78.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.78.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.79.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.79.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.80.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.80.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.81.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.81.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.82.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.82.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.83.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.83.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.84.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.84.up_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.85.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.85.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.86.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.86.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.87.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.87.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.88.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.88.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.89.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.89.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.90.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.90.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.91.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.91.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.92.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.92.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.93.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.93.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.94.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.94.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.95.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.95.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.96.gate_proj.weight": 
"model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.96.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.97.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.97.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.98.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.98.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.99.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.99.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.100.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.100.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.101.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.101.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.102.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.102.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.103.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.103.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.104.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.104.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.105.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.105.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.106.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.106.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.107.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.107.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.108.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.108.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.109.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.109.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.110.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.110.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.111.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.111.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.112.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.112.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.113.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.113.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.114.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.114.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.115.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.115.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.116.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.116.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.117.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.117.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.118.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.118.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.119.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.119.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.120.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.120.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.121.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.121.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.122.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.122.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.123.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.123.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.124.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.124.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.125.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.125.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.126.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.126.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.127.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.127.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.128.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.128.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.129.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.129.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.130.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.130.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.131.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.131.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.132.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.132.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.133.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.133.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.134.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.134.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.135.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.135.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.136.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.136.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.137.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.137.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.138.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.138.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.139.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.139.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.140.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.140.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.141.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.141.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.142.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.142.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.143.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.143.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.144.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.144.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.145.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.145.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.146.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.146.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.147.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.147.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.148.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.148.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.149.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.149.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.150.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.150.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.151.gate_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.151.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.152.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.152.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.153.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.153.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.154.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.154.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.155.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.155.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.156.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.156.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.157.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.157.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.158.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.158.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.159.gate_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.159.up_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.0.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.1.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.2.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.3.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.4.down_proj.weight": "model-00099-of-00132.safetensors", + 
"model.layers.70.mlp.experts.5.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.6.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.7.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.8.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.9.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.10.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.11.down_proj.weight": "model-00099-of-00132.safetensors", + "model.layers.70.mlp.experts.12.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.13.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.14.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.15.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.16.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.17.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.18.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.19.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.20.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.21.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.22.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.23.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.24.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.25.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.26.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.27.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.28.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.29.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.30.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.31.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.32.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.33.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.34.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.35.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.36.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.37.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.38.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.39.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.40.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.41.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.42.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.43.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.44.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.45.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.46.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.47.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.48.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.49.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.50.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.51.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.52.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.53.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.54.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.55.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.56.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.57.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.58.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.59.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.60.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.61.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.62.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.63.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.64.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.65.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.66.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.67.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.68.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.69.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.70.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.71.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.72.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.73.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.74.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.75.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.76.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.77.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.78.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.79.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.80.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.81.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.82.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.83.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.84.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.85.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.86.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.87.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.88.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.89.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.90.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.91.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.92.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.93.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.94.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.95.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.96.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.97.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.98.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.99.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.100.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.101.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.102.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.103.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.104.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.105.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.106.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.107.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.108.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.109.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.110.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.111.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.112.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.113.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.114.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.115.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.116.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.117.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.118.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.119.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.120.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.121.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.122.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.123.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.124.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.125.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.126.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.127.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.128.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.129.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.130.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.131.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.132.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.133.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.134.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.135.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.136.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.137.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.138.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.139.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.140.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.141.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.142.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.143.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.144.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.145.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.146.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.147.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.148.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.149.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.150.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.151.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.152.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.153.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.154.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.155.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.156.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.157.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.experts.158.down_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.70.mlp.experts.159.down_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.shared_experts.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.70.mlp.shared_experts.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.self_attn.o_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.self_attn.q_norm.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.gate.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.gate.e_score_correction_bias": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.0.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.0.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.1.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.1.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.2.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.2.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.3.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.3.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.4.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.4.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.5.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.5.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.6.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.6.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.7.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.7.up_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.71.mlp.experts.8.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.8.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.9.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.9.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.10.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.10.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.11.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.11.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.12.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.12.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.13.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.13.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.14.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.14.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.15.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.15.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.16.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.16.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.17.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.17.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.18.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.18.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.19.gate_proj.weight": 
"model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.19.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.20.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.20.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.21.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.21.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.22.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.22.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.23.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.23.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.24.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.24.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.25.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.25.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.26.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.26.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.27.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.27.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.28.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.28.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.29.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.29.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.30.gate_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.71.mlp.experts.30.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.31.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.31.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.32.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.32.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.33.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.33.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.34.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.34.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.35.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.35.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.36.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.36.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.37.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.37.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.38.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.38.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.39.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.39.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.40.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.40.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.41.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.41.up_proj.weight": 
"model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.42.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.42.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.43.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.43.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.44.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.44.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.45.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.45.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.46.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.46.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.47.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.47.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.48.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.48.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.49.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.49.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.50.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.50.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.51.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.51.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.52.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.52.up_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.71.mlp.experts.53.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.53.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.54.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.54.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.55.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.55.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.56.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.56.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.57.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.57.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.58.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.58.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.59.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.59.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.60.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.60.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.61.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.61.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.62.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.62.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.63.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.63.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.64.gate_proj.weight": 
"model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.64.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.65.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.65.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.66.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.66.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.67.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.67.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.68.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.68.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.69.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.69.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.70.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.70.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.71.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.71.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.72.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.72.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.73.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.73.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.74.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.74.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.75.gate_proj.weight": "model-00100-of-00132.safetensors", + 
"model.layers.71.mlp.experts.75.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.76.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.76.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.77.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.77.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.78.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.78.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.79.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.79.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.80.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.80.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.81.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.81.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.82.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.82.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.83.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.83.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.84.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.84.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.85.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.85.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.86.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.86.up_proj.weight": 
"model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.87.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.87.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.88.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.88.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.89.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.89.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.90.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.90.up_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.91.gate_proj.weight": "model-00100-of-00132.safetensors", + "model.layers.71.mlp.experts.91.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.92.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.92.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.93.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.93.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.94.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.94.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.95.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.95.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.96.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.96.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.97.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.97.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.98.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.98.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.99.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.99.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.100.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.100.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.101.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.101.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.102.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.102.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.103.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.103.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.104.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.104.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.105.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.105.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.106.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.106.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.107.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.107.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.108.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.108.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.109.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.109.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.110.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.110.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.111.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.111.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.112.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.112.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.113.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.113.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.114.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.114.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.115.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.115.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.116.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.116.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.117.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.117.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.118.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.118.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.119.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.119.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.120.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.120.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.121.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.121.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.122.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.122.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.123.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.123.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.124.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.124.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.125.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.125.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.126.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.126.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.127.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.127.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.128.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.128.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.129.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.129.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.130.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.130.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.131.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.131.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.132.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.132.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.133.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.133.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.134.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.134.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.135.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.135.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.136.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.136.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.137.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.137.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.138.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.138.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.139.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.139.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.140.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.140.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.141.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.141.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.142.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.142.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.143.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.143.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.144.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.144.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.145.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.145.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.146.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.146.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.147.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.147.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.148.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.148.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.149.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.149.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.150.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.150.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.151.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.151.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.152.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.152.up_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.153.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.153.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.154.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.154.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.155.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.155.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.156.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.156.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.157.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.157.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.158.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.158.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.159.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.159.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.0.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.1.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.2.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.3.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.4.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.5.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.6.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.7.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.8.down_proj.weight": 
"model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.9.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.10.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.11.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.12.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.13.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.14.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.15.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.16.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.17.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.18.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.19.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.20.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.21.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.22.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.23.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.24.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.25.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.26.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.27.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.28.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.29.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.30.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.31.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.32.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.33.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.34.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.35.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.36.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.37.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.38.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.39.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.40.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.41.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.42.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.43.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.44.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.45.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.46.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.47.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.48.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.49.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.50.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.51.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.52.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.53.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.54.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.55.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.56.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.57.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.58.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.59.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.60.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.61.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.62.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.63.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.64.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.65.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.66.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.67.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.68.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.69.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.70.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.71.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.72.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.73.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.74.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.75.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.76.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.77.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.78.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.79.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.80.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.81.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.82.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.83.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.84.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.85.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.86.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.87.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.88.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.89.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.90.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.91.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.92.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.93.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.94.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.95.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.96.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.97.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.98.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.99.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.100.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.101.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.102.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.103.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.104.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.105.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.106.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.107.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.108.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.109.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.110.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.111.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.112.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.113.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.114.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.115.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.116.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.117.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.118.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.119.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.120.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.121.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.122.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.123.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.124.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.125.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.126.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.127.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.128.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.129.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.130.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.131.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.132.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.133.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.134.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.135.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.136.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.137.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.138.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.139.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.140.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.71.mlp.experts.141.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.142.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.143.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.144.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.145.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.146.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.147.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.148.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.149.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.150.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.151.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.152.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.153.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.154.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.155.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.156.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.157.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.158.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.experts.159.down_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.shared_experts.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.shared_experts.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.71.mlp.shared_experts.down_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.72.self_attn.q_proj.bias": "model-00101-of-00132.safetensors", + "model.layers.72.self_attn.k_proj.bias": "model-00101-of-00132.safetensors", + "model.layers.72.self_attn.v_proj.bias": "model-00101-of-00132.safetensors", + "model.layers.72.self_attn.q_norm.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.0.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.0.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.1.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.1.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.2.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.2.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.3.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.3.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.4.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.4.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.5.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.5.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.6.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.6.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.7.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.7.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.8.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.8.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.9.gate_proj.weight": "model-00101-of-00132.safetensors", + 
"model.layers.72.mlp.experts.9.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.10.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.10.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.11.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.11.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.12.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.12.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.13.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.13.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.14.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.14.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.15.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.15.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.16.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.16.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.17.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.17.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.18.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.18.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.19.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.19.up_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.20.gate_proj.weight": "model-00101-of-00132.safetensors", + "model.layers.72.mlp.experts.20.up_proj.weight": 
"model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.21.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.21.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.22.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.22.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.23.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.23.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.24.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.24.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.25.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.25.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.26.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.26.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.27.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.27.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.28.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.28.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.29.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.29.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.30.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.30.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.31.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.31.up_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.32.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.32.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.33.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.33.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.34.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.34.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.35.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.35.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.36.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.36.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.37.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.37.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.38.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.38.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.39.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.39.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.40.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.40.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.41.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.41.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.42.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.42.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.43.gate_proj.weight": 
"model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.43.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.44.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.44.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.45.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.45.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.46.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.46.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.47.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.47.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.48.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.48.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.49.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.49.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.50.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.50.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.51.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.51.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.52.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.52.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.53.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.53.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.54.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.54.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.55.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.55.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.56.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.56.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.57.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.57.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.58.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.58.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.59.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.59.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.60.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.60.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.61.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.61.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.62.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.62.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.63.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.63.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.64.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.64.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.65.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.65.up_proj.weight": 
"model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.66.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.66.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.67.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.67.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.68.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.68.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.69.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.69.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.70.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.70.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.71.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.71.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.72.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.72.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.73.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.73.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.74.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.74.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.75.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.75.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.76.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.76.up_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.77.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.77.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.78.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.78.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.79.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.79.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.80.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.80.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.81.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.81.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.82.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.82.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.83.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.83.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.84.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.84.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.85.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.85.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.86.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.86.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.87.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.87.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.88.gate_proj.weight": 
"model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.88.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.89.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.89.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.90.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.90.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.91.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.91.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.92.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.92.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.93.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.93.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.94.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.94.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.95.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.95.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.96.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.96.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.97.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.97.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.98.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.98.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.99.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.99.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.100.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.100.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.101.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.101.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.102.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.102.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.103.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.103.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.104.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.104.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.105.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.105.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.106.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.106.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.107.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.107.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.108.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.108.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.109.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.109.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.110.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.110.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.111.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.111.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.112.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.112.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.113.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.113.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.114.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.114.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.115.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.115.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.116.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.116.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.117.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.117.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.118.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.118.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.119.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.119.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.120.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.120.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.121.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.121.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.122.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.122.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.123.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.123.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.124.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.124.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.125.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.125.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.126.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.126.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.127.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.127.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.128.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.128.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.129.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.129.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.130.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.130.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.131.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.131.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.132.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.132.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.133.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.133.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.134.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.134.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.135.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.135.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.136.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.136.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.137.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.137.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.138.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.138.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.139.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.139.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.140.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.140.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.141.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.141.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.142.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.142.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.143.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.143.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.144.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.144.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.145.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.145.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.146.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.146.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.147.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.147.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.148.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.148.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.149.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.149.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.150.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.150.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.151.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.151.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.152.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.152.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.153.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.153.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.154.gate_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.154.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.155.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.155.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.156.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.156.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.157.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.157.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.158.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.158.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.159.gate_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.159.up_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.0.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.1.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.2.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.3.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.4.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.5.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.6.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.7.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.8.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.9.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.10.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.11.down_proj.weight": 
"model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.12.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.13.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.14.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.15.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.16.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.17.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.18.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.19.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.20.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.21.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.22.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.23.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.24.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.25.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.26.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.27.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.28.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.29.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.30.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.31.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.32.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.33.down_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.34.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.35.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.36.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.37.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.38.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.39.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.40.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.41.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.42.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.43.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.44.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.45.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.46.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.47.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.48.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.49.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.50.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.51.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.52.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.53.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.54.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.55.down_proj.weight": "model-00102-of-00132.safetensors", + 
"model.layers.72.mlp.experts.56.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.57.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.58.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.59.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.60.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.61.down_proj.weight": "model-00102-of-00132.safetensors", + "model.layers.72.mlp.experts.62.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.63.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.64.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.65.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.66.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.67.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.68.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.69.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.70.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.71.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.72.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.73.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.74.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.75.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.76.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.77.down_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.72.mlp.experts.78.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.79.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.80.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.81.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.82.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.83.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.84.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.85.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.86.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.87.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.88.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.89.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.90.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.91.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.92.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.93.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.94.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.95.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.96.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.97.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.98.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.99.down_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.72.mlp.experts.100.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.101.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.102.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.103.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.104.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.105.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.106.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.107.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.108.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.109.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.110.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.111.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.112.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.113.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.114.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.115.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.116.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.117.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.118.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.119.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.120.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.121.down_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.72.mlp.experts.122.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.123.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.124.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.125.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.126.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.127.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.128.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.129.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.130.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.131.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.132.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.133.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.134.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.135.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.136.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.137.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.138.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.139.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.140.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.141.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.142.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.143.down_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.72.mlp.experts.144.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.145.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.146.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.147.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.148.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.149.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.150.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.151.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.152.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.153.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.154.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.155.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.156.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.157.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.158.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.experts.159.down_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.shared_experts.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.72.mlp.shared_experts.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.self_attn.o_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.self_attn.q_norm.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.gate.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.gate.e_score_correction_bias": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.0.gate_proj.weight": 
"model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.0.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.1.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.1.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.2.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.2.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.3.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.3.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.4.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.4.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.5.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.5.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.6.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.6.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.7.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.7.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.8.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.8.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.9.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.9.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.10.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.10.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.11.gate_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.11.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.12.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.12.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.13.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.13.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.14.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.14.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.15.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.15.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.16.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.16.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.17.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.17.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.18.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.18.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.19.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.19.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.20.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.20.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.21.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.21.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.22.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.22.up_proj.weight": 
"model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.23.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.23.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.24.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.24.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.25.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.25.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.26.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.26.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.27.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.27.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.28.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.28.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.29.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.29.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.30.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.30.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.31.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.31.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.32.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.32.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.33.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.33.up_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.34.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.34.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.35.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.35.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.36.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.36.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.37.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.37.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.38.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.38.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.39.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.39.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.40.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.40.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.41.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.41.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.42.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.42.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.43.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.43.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.44.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.44.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.45.gate_proj.weight": 
"model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.45.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.46.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.46.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.47.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.47.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.48.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.48.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.49.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.49.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.50.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.50.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.51.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.51.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.52.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.52.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.53.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.53.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.54.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.54.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.55.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.55.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.56.gate_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.56.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.57.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.57.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.58.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.58.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.59.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.59.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.60.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.60.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.61.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.61.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.62.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.62.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.63.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.63.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.64.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.64.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.65.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.65.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.66.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.66.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.67.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.67.up_proj.weight": 
"model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.68.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.68.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.69.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.69.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.70.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.70.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.71.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.71.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.72.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.72.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.73.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.73.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.74.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.74.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.75.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.75.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.76.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.76.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.77.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.77.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.78.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.78.up_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.79.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.79.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.80.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.80.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.81.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.81.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.82.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.82.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.83.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.83.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.84.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.84.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.85.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.85.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.86.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.86.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.87.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.87.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.88.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.88.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.89.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.89.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.90.gate_proj.weight": 
"model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.90.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.91.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.91.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.92.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.92.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.93.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.93.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.94.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.94.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.95.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.95.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.96.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.96.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.97.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.97.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.98.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.98.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.99.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.99.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.100.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.100.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.101.gate_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.101.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.102.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.102.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.103.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.103.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.104.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.104.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.105.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.105.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.106.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.106.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.107.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.107.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.108.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.108.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.109.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.109.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.110.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.110.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.111.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.111.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.112.gate_proj.weight": "model-00103-of-00132.safetensors", + 
"model.layers.73.mlp.experts.112.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.113.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.113.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.114.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.114.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.115.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.115.up_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.116.gate_proj.weight": "model-00103-of-00132.safetensors", + "model.layers.73.mlp.experts.116.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.117.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.117.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.118.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.118.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.119.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.119.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.120.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.120.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.121.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.121.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.122.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.122.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.123.gate_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.123.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.124.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.124.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.125.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.125.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.126.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.126.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.127.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.127.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.128.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.128.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.129.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.129.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.130.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.130.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.131.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.131.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.132.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.132.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.133.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.133.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.134.gate_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.134.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.135.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.135.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.136.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.136.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.137.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.137.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.138.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.138.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.139.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.139.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.140.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.140.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.141.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.141.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.142.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.142.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.143.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.143.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.144.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.144.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.145.gate_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.145.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.146.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.146.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.147.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.147.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.148.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.148.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.149.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.149.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.150.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.150.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.151.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.151.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.152.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.152.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.153.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.153.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.154.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.154.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.155.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.155.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.156.gate_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.156.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.157.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.157.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.158.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.158.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.159.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.159.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.0.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.1.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.2.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.3.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.4.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.5.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.6.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.7.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.8.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.9.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.10.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.11.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.12.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.13.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.14.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.15.down_proj.weight": 
"model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.16.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.17.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.18.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.19.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.20.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.21.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.22.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.23.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.24.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.25.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.26.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.27.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.28.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.29.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.30.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.31.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.32.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.33.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.34.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.35.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.36.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.37.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.38.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.39.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.40.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.41.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.42.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.43.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.44.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.45.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.46.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.47.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.48.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.49.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.50.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.51.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.52.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.53.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.54.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.55.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.56.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.57.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.58.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.59.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.60.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.61.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.62.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.63.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.64.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.65.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.66.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.67.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.68.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.69.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.70.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.71.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.72.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.73.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.74.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.75.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.76.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.77.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.78.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.79.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.80.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.81.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.82.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.83.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.84.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.85.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.86.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.87.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.88.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.89.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.90.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.91.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.92.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.93.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.94.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.95.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.96.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.97.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.98.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.99.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.100.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.101.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.102.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.103.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.104.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.105.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.106.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.107.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.108.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.109.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.110.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.111.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.112.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.113.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.114.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.115.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.116.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.117.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.118.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.119.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.120.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.121.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.122.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.123.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.124.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.125.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.126.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.127.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.128.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.129.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.130.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.131.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.132.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.133.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.134.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.135.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.136.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.137.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.138.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.139.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.140.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.141.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.142.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.143.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.144.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.145.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.146.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.147.down_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.73.mlp.experts.148.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.149.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.150.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.151.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.152.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.153.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.154.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.155.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.156.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.157.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.158.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.experts.159.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.shared_experts.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.shared_experts.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.73.mlp.shared_experts.down_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.self_attn.q_proj.bias": "model-00104-of-00132.safetensors", + "model.layers.74.self_attn.k_proj.bias": "model-00104-of-00132.safetensors", + "model.layers.74.self_attn.v_proj.bias": "model-00104-of-00132.safetensors", + "model.layers.74.self_attn.q_norm.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.0.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.0.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.1.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.1.up_proj.weight": 
"model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.2.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.2.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.3.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.3.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.4.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.4.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.5.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.5.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.6.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.6.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.7.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.7.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.8.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.8.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.9.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.9.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.10.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.10.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.11.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.11.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.12.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.12.up_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.74.mlp.experts.13.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.13.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.14.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.14.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.15.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.15.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.16.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.16.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.17.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.17.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.18.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.18.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.19.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.19.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.20.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.20.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.21.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.21.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.22.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.22.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.23.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.23.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.24.gate_proj.weight": 
"model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.24.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.25.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.25.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.26.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.26.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.27.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.27.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.28.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.28.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.29.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.29.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.30.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.30.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.31.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.31.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.32.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.32.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.33.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.33.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.34.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.34.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.35.gate_proj.weight": "model-00104-of-00132.safetensors", + 
"model.layers.74.mlp.experts.35.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.36.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.36.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.37.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.37.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.38.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.38.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.39.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.39.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.40.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.40.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.41.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.41.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.42.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.42.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.43.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.43.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.44.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.44.up_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.45.gate_proj.weight": "model-00104-of-00132.safetensors", + "model.layers.74.mlp.experts.45.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.46.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.46.up_proj.weight": 
"model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.47.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.47.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.48.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.48.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.49.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.49.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.50.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.50.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.51.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.51.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.52.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.52.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.53.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.53.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.54.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.54.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.55.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.55.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.56.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.56.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.57.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.57.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.58.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.58.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.59.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.59.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.60.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.60.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.61.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.61.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.62.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.62.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.63.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.63.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.64.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.64.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.65.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.65.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.66.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.66.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.67.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.67.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.68.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.68.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.69.gate_proj.weight": 
"model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.69.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.70.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.70.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.71.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.71.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.72.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.72.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.73.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.73.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.74.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.74.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.75.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.75.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.76.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.76.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.77.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.77.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.78.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.78.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.79.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.79.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.80.gate_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.80.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.81.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.81.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.82.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.82.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.83.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.83.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.84.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.84.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.85.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.85.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.86.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.86.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.87.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.87.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.88.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.88.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.89.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.89.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.90.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.90.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.91.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.91.up_proj.weight": 
"model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.92.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.92.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.93.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.93.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.94.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.94.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.95.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.95.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.96.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.96.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.97.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.97.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.98.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.98.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.99.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.99.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.100.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.100.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.101.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.101.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.102.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.102.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.103.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.103.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.104.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.104.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.105.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.105.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.106.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.106.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.107.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.107.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.108.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.108.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.109.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.109.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.110.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.110.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.111.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.111.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.112.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.112.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.113.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.113.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.114.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.114.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.115.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.115.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.116.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.116.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.117.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.117.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.118.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.118.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.119.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.119.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.120.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.120.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.121.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.121.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.122.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.122.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.123.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.123.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.124.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.124.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.125.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.125.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.126.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.126.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.127.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.127.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.128.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.128.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.129.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.129.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.130.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.130.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.131.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.131.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.132.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.132.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.133.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.133.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.134.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.134.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.135.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.135.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.136.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.136.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.137.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.137.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.138.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.138.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.139.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.139.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.140.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.140.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.141.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.141.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.142.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.142.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.143.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.143.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.144.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.144.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.145.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.145.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.146.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.146.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.147.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.147.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.148.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.148.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.149.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.149.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.150.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.150.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.151.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.151.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.152.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.152.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.153.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.153.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.154.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.154.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.155.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.155.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.156.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.156.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.157.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.157.up_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.158.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.158.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.159.gate_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.159.up_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.0.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.1.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.2.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.3.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.4.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.5.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.6.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.7.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.8.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.9.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.10.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.11.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.12.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.13.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.14.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.15.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.16.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.17.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.18.down_proj.weight": 
"model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.19.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.20.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.21.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.22.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.23.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.24.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.25.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.26.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.27.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.28.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.29.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.30.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.31.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.32.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.33.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.34.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.35.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.36.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.37.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.38.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.39.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.40.down_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.41.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.42.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.43.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.44.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.45.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.46.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.47.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.48.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.49.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.50.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.51.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.52.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.53.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.54.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.55.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.56.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.57.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.58.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.59.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.60.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.61.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.62.down_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.63.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.64.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.65.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.66.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.67.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.68.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.69.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.70.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.71.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.72.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.73.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.74.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.75.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.76.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.77.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.78.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.79.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.80.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.81.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.82.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.83.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.84.down_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.85.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.86.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.87.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.88.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.89.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.90.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.91.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.92.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.93.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.94.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.95.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.96.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.97.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.98.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.99.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.100.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.101.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.102.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.103.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.104.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.105.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.106.down_proj.weight": "model-00105-of-00132.safetensors", + 
"model.layers.74.mlp.experts.107.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.108.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.109.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.110.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.111.down_proj.weight": "model-00105-of-00132.safetensors", + "model.layers.74.mlp.experts.112.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.113.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.114.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.115.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.116.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.117.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.118.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.119.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.120.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.121.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.122.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.123.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.124.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.125.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.126.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.127.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.128.down_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.74.mlp.experts.129.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.130.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.131.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.132.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.133.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.134.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.135.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.136.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.137.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.138.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.139.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.140.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.141.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.142.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.143.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.144.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.145.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.146.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.147.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.148.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.149.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.150.down_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.74.mlp.experts.151.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.152.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.153.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.154.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.155.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.156.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.157.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.158.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.experts.159.down_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.shared_experts.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.74.mlp.shared_experts.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.self_attn.o_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.self_attn.q_norm.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.gate.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.gate.e_score_correction_bias": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.0.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.0.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.1.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.1.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.2.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.2.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.3.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.3.up_proj.weight": 
"model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.4.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.4.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.5.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.5.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.6.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.6.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.7.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.7.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.8.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.8.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.9.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.9.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.10.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.10.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.11.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.11.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.12.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.12.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.13.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.13.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.14.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.14.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.15.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.15.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.16.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.16.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.17.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.17.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.18.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.18.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.19.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.19.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.20.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.20.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.21.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.21.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.22.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.22.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.23.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.23.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.24.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.24.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.25.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.25.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.26.gate_proj.weight": 
"model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.26.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.27.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.27.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.28.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.28.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.29.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.29.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.30.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.30.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.31.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.31.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.32.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.32.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.33.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.33.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.34.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.34.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.35.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.35.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.36.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.36.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.37.gate_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.37.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.38.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.38.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.39.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.39.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.40.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.40.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.41.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.41.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.42.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.42.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.43.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.43.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.44.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.44.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.45.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.45.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.46.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.46.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.47.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.47.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.48.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.48.up_proj.weight": 
"model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.49.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.49.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.50.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.50.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.51.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.51.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.52.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.52.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.53.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.53.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.54.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.54.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.55.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.55.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.56.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.56.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.57.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.57.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.58.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.58.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.59.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.59.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.60.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.60.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.61.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.61.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.62.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.62.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.63.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.63.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.64.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.64.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.65.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.65.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.66.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.66.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.67.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.67.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.68.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.68.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.69.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.69.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.70.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.70.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.71.gate_proj.weight": 
"model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.71.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.72.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.72.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.73.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.73.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.74.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.74.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.75.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.75.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.76.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.76.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.77.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.77.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.78.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.78.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.79.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.79.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.80.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.80.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.81.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.81.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.82.gate_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.82.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.83.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.83.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.84.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.84.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.85.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.85.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.86.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.86.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.87.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.87.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.88.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.88.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.89.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.89.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.90.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.90.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.91.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.91.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.92.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.92.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.93.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.93.up_proj.weight": 
"model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.94.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.94.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.95.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.95.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.96.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.96.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.97.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.97.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.98.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.98.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.99.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.99.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.100.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.100.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.101.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.101.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.102.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.102.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.103.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.103.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.104.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.104.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.105.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.105.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.106.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.106.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.107.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.107.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.108.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.108.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.109.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.109.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.110.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.110.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.111.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.111.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.112.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.112.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.113.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.113.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.114.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.114.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.115.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.115.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.116.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.116.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.117.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.117.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.118.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.118.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.119.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.119.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.120.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.120.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.121.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.121.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.122.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.122.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.123.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.123.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.124.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.124.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.125.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.125.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.126.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.126.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.127.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.127.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.128.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.128.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.129.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.129.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.130.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.130.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.131.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.131.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.132.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.132.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.133.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.133.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.134.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.134.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.135.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.135.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.136.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.136.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.137.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.137.up_proj.weight": "model-00106-of-00132.safetensors", + 
"model.layers.75.mlp.experts.138.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.138.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.139.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.139.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.140.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.140.up_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.141.gate_proj.weight": "model-00106-of-00132.safetensors", + "model.layers.75.mlp.experts.141.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.142.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.142.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.143.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.143.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.144.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.144.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.145.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.145.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.146.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.146.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.147.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.147.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.148.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.148.up_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.149.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.149.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.150.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.150.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.151.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.151.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.152.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.152.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.153.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.153.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.154.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.154.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.155.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.155.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.156.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.156.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.157.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.157.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.158.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.158.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.159.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.159.up_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.0.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.1.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.2.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.3.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.4.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.5.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.6.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.7.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.8.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.9.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.10.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.11.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.12.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.13.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.14.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.15.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.16.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.17.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.18.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.19.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.20.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.21.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.22.down_proj.weight": 
"model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.23.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.24.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.25.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.26.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.27.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.28.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.29.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.30.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.31.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.32.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.33.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.34.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.35.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.36.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.37.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.38.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.39.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.40.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.41.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.42.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.43.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.44.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.45.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.46.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.47.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.48.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.49.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.50.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.51.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.52.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.53.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.54.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.55.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.56.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.57.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.58.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.59.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.60.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.61.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.62.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.63.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.64.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.65.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.66.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.67.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.68.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.69.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.70.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.71.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.72.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.73.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.74.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.75.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.76.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.77.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.78.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.79.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.80.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.81.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.82.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.83.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.84.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.85.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.86.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.87.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.88.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.89.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.90.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.91.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.92.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.93.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.94.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.95.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.96.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.97.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.98.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.99.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.100.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.101.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.102.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.103.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.104.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.105.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.106.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.107.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.108.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.109.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.110.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.111.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.112.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.113.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.114.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.115.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.116.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.117.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.118.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.119.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.120.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.121.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.122.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.123.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.124.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.125.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.126.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.127.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.128.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.129.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.130.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.131.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.132.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.133.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.134.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.135.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.136.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.137.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.138.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.139.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.140.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.141.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.142.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.143.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.144.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.145.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.146.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.147.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.148.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.149.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.150.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.151.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.152.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.153.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.154.down_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.75.mlp.experts.155.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.156.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.157.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.158.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.experts.159.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.shared_experts.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.shared_experts.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.75.mlp.shared_experts.down_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.self_attn.q_proj.bias": "model-00107-of-00132.safetensors", + "model.layers.76.self_attn.k_proj.bias": "model-00107-of-00132.safetensors", + "model.layers.76.self_attn.v_proj.bias": "model-00107-of-00132.safetensors", + "model.layers.76.self_attn.q_norm.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.0.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.0.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.1.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.1.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.2.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.2.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.3.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.3.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.4.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.4.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.5.gate_proj.weight": 
"model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.5.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.6.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.6.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.7.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.7.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.8.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.8.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.9.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.9.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.10.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.10.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.11.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.11.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.12.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.12.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.13.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.13.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.14.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.14.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.15.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.15.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.16.gate_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.76.mlp.experts.16.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.17.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.17.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.18.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.18.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.19.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.19.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.20.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.20.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.21.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.21.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.22.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.22.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.23.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.23.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.24.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.24.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.25.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.25.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.26.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.26.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.27.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.27.up_proj.weight": 
"model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.28.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.28.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.29.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.29.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.30.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.30.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.31.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.31.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.32.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.32.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.33.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.33.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.34.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.34.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.35.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.35.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.36.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.36.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.37.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.37.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.38.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.38.up_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.76.mlp.experts.39.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.39.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.40.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.40.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.41.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.41.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.42.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.42.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.43.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.43.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.44.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.44.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.45.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.45.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.46.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.46.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.47.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.47.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.48.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.48.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.49.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.49.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.50.gate_proj.weight": 
"model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.50.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.51.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.51.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.52.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.52.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.53.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.53.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.54.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.54.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.55.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.55.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.56.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.56.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.57.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.57.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.58.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.58.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.59.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.59.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.60.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.60.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.61.gate_proj.weight": "model-00107-of-00132.safetensors", + 
"model.layers.76.mlp.experts.61.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.62.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.62.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.63.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.63.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.64.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.64.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.65.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.65.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.66.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.66.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.67.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.67.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.68.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.68.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.69.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.69.up_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.70.gate_proj.weight": "model-00107-of-00132.safetensors", + "model.layers.76.mlp.experts.70.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.71.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.71.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.72.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.72.up_proj.weight": 
"model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.73.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.73.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.74.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.74.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.75.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.75.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.76.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.76.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.77.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.77.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.78.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.78.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.79.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.79.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.80.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.80.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.81.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.81.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.82.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.82.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.83.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.83.up_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.84.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.84.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.85.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.85.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.86.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.86.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.87.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.87.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.88.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.88.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.89.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.89.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.90.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.90.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.91.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.91.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.92.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.92.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.93.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.93.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.94.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.94.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.95.gate_proj.weight": 
"model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.95.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.96.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.96.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.97.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.97.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.98.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.98.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.99.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.99.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.100.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.100.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.101.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.101.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.102.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.102.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.103.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.103.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.104.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.104.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.105.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.105.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.106.gate_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.106.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.107.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.107.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.108.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.108.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.109.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.109.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.110.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.110.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.111.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.111.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.112.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.112.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.113.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.113.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.114.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.114.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.115.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.115.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.116.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.116.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.117.gate_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.117.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.118.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.118.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.119.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.119.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.120.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.120.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.121.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.121.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.122.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.122.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.123.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.123.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.124.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.124.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.125.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.125.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.126.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.126.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.127.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.127.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.128.gate_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.128.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.129.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.129.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.130.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.130.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.131.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.131.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.132.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.132.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.133.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.133.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.134.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.134.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.135.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.135.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.136.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.136.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.137.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.137.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.138.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.138.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.139.gate_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.139.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.140.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.140.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.141.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.141.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.142.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.142.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.143.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.143.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.144.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.144.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.145.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.145.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.146.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.146.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.147.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.147.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.148.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.148.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.149.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.149.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.150.gate_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.150.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.151.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.151.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.152.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.152.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.153.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.153.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.154.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.154.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.155.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.155.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.156.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.156.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.157.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.157.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.158.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.158.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.159.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.159.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.0.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.1.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.2.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.3.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.4.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.5.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.6.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.7.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.8.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.9.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.10.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.11.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.12.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.13.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.14.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.15.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.16.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.17.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.18.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.19.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.20.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.21.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.22.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.23.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.24.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.25.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.26.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.27.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.28.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.29.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.30.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.31.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.32.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.33.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.34.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.35.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.36.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.37.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.38.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.39.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.40.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.41.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.42.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.43.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.44.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.45.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.46.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.47.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.48.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.49.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.50.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.51.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.52.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.53.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.54.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.55.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.56.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.57.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.58.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.59.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.60.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.61.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.62.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.63.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.64.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.65.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.66.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.67.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.68.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.69.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.70.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.71.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.72.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.73.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.74.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.75.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.76.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.77.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.78.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.79.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.80.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.81.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.82.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.83.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.84.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.85.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.86.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.87.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.88.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.89.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.90.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.91.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.92.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.93.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.94.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.95.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.96.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.97.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.98.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.99.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.100.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.101.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.102.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.103.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.104.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.105.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.106.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.107.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.108.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.109.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.110.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.111.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.112.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.113.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.114.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.115.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.116.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.117.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.118.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.119.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.120.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.121.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.122.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.123.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.124.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.125.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.126.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.127.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.128.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.129.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.130.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.131.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.132.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.133.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.134.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.135.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.136.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.137.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.138.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.139.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.140.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.141.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.142.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.143.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.144.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.145.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.146.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.147.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.148.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.149.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.150.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.151.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.152.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.153.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.154.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.155.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.156.down_proj.weight": "model-00108-of-00132.safetensors", + 
"model.layers.76.mlp.experts.157.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.158.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.experts.159.down_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.shared_experts.gate_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.76.mlp.shared_experts.up_proj.weight": "model-00108-of-00132.safetensors", + "model.layers.77.self_attn.o_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.self_attn.q_norm.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.gate.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.gate.e_score_correction_bias": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.0.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.0.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.1.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.1.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.2.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.2.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.3.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.3.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.4.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.4.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.5.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.5.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.6.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.6.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.7.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.7.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.8.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.8.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.9.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.9.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.10.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.10.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.11.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.11.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.12.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.12.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.13.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.13.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.14.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.14.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.15.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.15.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.16.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.16.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.17.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.17.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.18.gate_proj.weight": 
"model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.18.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.19.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.19.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.20.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.20.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.21.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.21.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.22.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.22.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.23.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.23.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.24.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.24.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.25.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.25.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.26.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.26.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.27.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.27.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.28.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.28.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.29.gate_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.29.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.30.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.30.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.31.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.31.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.32.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.32.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.33.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.33.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.34.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.34.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.35.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.35.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.36.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.36.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.37.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.37.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.38.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.38.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.39.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.39.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.40.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.40.up_proj.weight": 
"model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.41.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.41.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.42.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.42.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.43.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.43.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.44.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.44.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.45.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.45.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.46.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.46.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.47.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.47.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.48.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.48.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.49.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.49.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.50.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.50.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.51.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.51.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.52.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.52.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.53.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.53.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.54.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.54.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.55.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.55.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.56.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.56.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.57.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.57.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.58.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.58.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.59.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.59.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.60.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.60.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.61.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.61.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.62.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.62.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.63.gate_proj.weight": 
"model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.63.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.64.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.64.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.65.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.65.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.66.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.66.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.67.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.67.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.68.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.68.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.69.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.69.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.70.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.70.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.71.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.71.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.72.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.72.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.73.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.73.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.74.gate_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.74.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.75.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.75.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.76.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.76.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.77.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.77.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.78.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.78.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.79.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.79.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.80.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.80.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.81.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.81.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.82.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.82.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.83.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.83.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.84.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.84.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.85.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.85.up_proj.weight": 
"model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.86.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.86.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.87.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.87.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.88.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.88.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.89.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.89.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.90.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.90.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.91.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.91.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.92.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.92.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.93.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.93.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.94.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.94.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.95.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.95.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.96.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.96.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.97.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.97.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.98.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.98.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.99.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.99.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.100.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.100.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.101.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.101.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.102.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.102.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.103.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.103.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.104.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.104.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.105.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.105.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.106.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.106.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.107.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.107.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.108.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.108.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.109.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.109.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.110.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.110.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.111.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.111.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.112.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.112.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.113.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.113.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.114.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.114.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.115.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.115.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.116.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.116.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.117.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.117.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.118.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.118.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.119.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.119.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.120.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.120.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.121.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.121.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.122.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.122.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.123.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.123.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.124.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.124.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.125.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.125.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.126.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.126.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.127.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.127.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.128.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.128.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.129.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.129.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.130.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.130.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.131.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.131.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.132.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.132.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.133.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.133.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.134.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.134.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.135.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.135.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.136.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.136.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.137.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.137.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.138.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.138.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.139.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.139.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.140.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.140.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.141.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.141.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.142.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.142.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.143.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.143.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.144.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.144.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.145.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.145.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.146.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.146.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.147.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.147.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.148.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.148.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.149.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.149.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.150.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.150.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.151.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.151.up_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.152.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.152.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.153.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.153.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.154.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.154.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.155.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.155.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.156.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.156.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.157.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.157.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.158.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.158.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.159.gate_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.159.up_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.0.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.1.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.2.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.3.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.4.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.5.down_proj.weight": "model-00109-of-00132.safetensors", + 
"model.layers.77.mlp.experts.6.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.7.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.8.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.9.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.10.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.11.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.12.down_proj.weight": "model-00109-of-00132.safetensors", + "model.layers.77.mlp.experts.13.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.14.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.15.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.16.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.17.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.18.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.19.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.20.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.21.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.22.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.23.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.24.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.25.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.26.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.27.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.28.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.29.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.30.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.31.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.32.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.33.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.34.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.35.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.36.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.37.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.38.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.39.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.40.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.41.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.42.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.43.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.44.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.45.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.46.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.47.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.48.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.49.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.50.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.51.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.52.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.53.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.54.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.55.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.56.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.57.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.58.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.59.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.60.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.61.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.62.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.63.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.64.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.65.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.66.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.67.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.68.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.69.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.70.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.71.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.72.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.73.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.74.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.75.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.76.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.77.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.78.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.79.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.80.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.81.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.82.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.83.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.84.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.85.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.86.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.87.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.88.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.89.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.90.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.91.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.92.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.93.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.94.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.95.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.96.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.97.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.98.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.99.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.100.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.101.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.102.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.103.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.104.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.105.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.106.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.107.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.108.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.109.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.110.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.111.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.112.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.113.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.114.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.115.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.116.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.117.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.118.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.119.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.120.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.121.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.122.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.123.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.124.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.125.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.126.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.127.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.128.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.129.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.130.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.131.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.132.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.133.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.134.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.135.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.136.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.137.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.experts.138.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.139.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.140.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.141.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.142.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.143.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.144.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.145.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.146.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.147.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.148.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.149.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.150.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.151.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.152.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.153.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.154.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.155.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.156.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.157.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.158.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.experts.159.down_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.77.mlp.shared_experts.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.shared_experts.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.77.mlp.shared_experts.down_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.self_attn.q_proj.bias": "model-00110-of-00132.safetensors", + "model.layers.78.self_attn.k_proj.bias": "model-00110-of-00132.safetensors", + "model.layers.78.self_attn.v_proj.bias": "model-00110-of-00132.safetensors", + "model.layers.78.self_attn.q_norm.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.0.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.0.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.1.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.1.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.2.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.2.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.3.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.3.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.4.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.4.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.5.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.5.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.6.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.6.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.7.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.7.up_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.78.mlp.experts.8.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.8.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.9.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.9.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.10.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.10.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.11.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.11.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.12.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.12.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.13.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.13.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.14.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.14.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.15.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.15.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.16.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.16.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.17.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.17.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.18.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.18.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.19.gate_proj.weight": 
"model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.19.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.20.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.20.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.21.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.21.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.22.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.22.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.23.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.23.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.24.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.24.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.25.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.25.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.26.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.26.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.27.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.27.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.28.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.28.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.29.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.29.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.30.gate_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.78.mlp.experts.30.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.31.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.31.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.32.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.32.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.33.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.33.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.34.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.34.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.35.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.35.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.36.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.36.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.37.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.37.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.38.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.38.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.39.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.39.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.40.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.40.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.41.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.41.up_proj.weight": 
"model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.42.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.42.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.43.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.43.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.44.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.44.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.45.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.45.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.46.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.46.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.47.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.47.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.48.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.48.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.49.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.49.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.50.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.50.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.51.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.51.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.52.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.52.up_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.78.mlp.experts.53.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.53.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.54.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.54.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.55.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.55.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.56.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.56.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.57.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.57.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.58.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.58.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.59.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.59.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.60.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.60.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.61.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.61.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.62.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.62.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.63.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.63.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.64.gate_proj.weight": 
"model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.64.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.65.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.65.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.66.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.66.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.67.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.67.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.68.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.68.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.69.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.69.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.70.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.70.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.71.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.71.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.72.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.72.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.73.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.73.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.74.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.74.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.75.gate_proj.weight": "model-00110-of-00132.safetensors", + 
"model.layers.78.mlp.experts.75.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.76.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.76.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.77.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.77.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.78.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.78.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.79.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.79.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.80.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.80.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.81.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.81.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.82.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.82.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.83.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.83.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.84.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.84.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.85.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.85.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.86.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.86.up_proj.weight": 
"model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.87.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.87.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.88.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.88.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.89.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.89.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.90.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.90.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.91.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.91.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.92.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.92.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.93.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.93.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.94.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.94.up_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.95.gate_proj.weight": "model-00110-of-00132.safetensors", + "model.layers.78.mlp.experts.95.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.96.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.96.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.97.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.97.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.98.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.98.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.99.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.99.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.100.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.100.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.101.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.101.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.102.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.102.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.103.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.103.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.104.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.104.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.105.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.105.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.106.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.106.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.107.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.107.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.108.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.108.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.109.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.109.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.110.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.110.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.111.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.111.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.112.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.112.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.113.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.113.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.114.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.114.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.115.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.115.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.116.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.116.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.117.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.117.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.118.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.118.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.119.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.119.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.120.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.120.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.121.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.121.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.122.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.122.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.123.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.123.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.124.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.124.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.125.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.125.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.126.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.126.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.127.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.127.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.128.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.128.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.129.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.129.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.130.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.130.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.131.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.131.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.132.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.132.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.133.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.133.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.134.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.134.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.135.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.135.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.136.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.136.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.137.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.137.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.138.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.138.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.139.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.139.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.140.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.140.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.141.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.141.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.142.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.142.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.143.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.143.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.144.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.144.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.145.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.145.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.146.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.146.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.147.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.147.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.148.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.148.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.149.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.149.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.150.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.150.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.151.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.151.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.152.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.152.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.153.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.153.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.154.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.154.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.155.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.155.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.156.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.156.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.157.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.157.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.158.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.158.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.159.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.159.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.0.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.1.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.2.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.3.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.4.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.5.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.6.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.7.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.8.down_proj.weight": 
"model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.9.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.10.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.11.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.12.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.13.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.14.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.15.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.16.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.17.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.18.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.19.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.20.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.21.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.22.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.23.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.24.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.25.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.26.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.27.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.28.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.29.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.30.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.31.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.32.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.33.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.34.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.35.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.36.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.37.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.38.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.39.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.40.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.41.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.42.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.43.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.44.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.45.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.46.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.47.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.48.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.49.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.50.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.51.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.52.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.53.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.54.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.55.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.56.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.57.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.58.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.59.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.60.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.61.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.62.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.63.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.64.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.65.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.66.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.67.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.68.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.69.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.70.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.71.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.72.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.73.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.74.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.75.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.76.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.77.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.78.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.79.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.80.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.81.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.82.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.83.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.84.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.85.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.86.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.87.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.88.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.89.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.90.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.91.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.92.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.93.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.94.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.95.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.96.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.97.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.98.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.99.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.100.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.101.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.102.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.103.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.104.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.105.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.106.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.107.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.108.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.109.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.110.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.111.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.112.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.113.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.114.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.115.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.116.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.117.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.118.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.119.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.120.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.121.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.122.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.123.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.124.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.125.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.126.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.127.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.128.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.129.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.130.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.131.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.132.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.133.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.134.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.135.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.136.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.137.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.138.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.139.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.140.down_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.78.mlp.experts.141.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.142.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.143.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.144.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.145.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.146.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.147.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.148.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.149.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.150.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.151.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.152.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.153.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.154.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.155.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.156.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.157.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.158.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.experts.159.down_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.shared_experts.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.78.mlp.shared_experts.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.self_attn.o_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.79.self_attn.q_norm.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.gate.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.gate.e_score_correction_bias": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.0.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.0.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.1.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.1.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.2.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.2.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.3.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.3.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.4.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.4.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.5.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.5.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.6.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.6.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.7.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.7.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.8.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.8.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.9.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.9.up_proj.weight": "model-00111-of-00132.safetensors", + 
"model.layers.79.mlp.experts.10.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.10.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.11.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.11.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.12.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.12.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.13.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.13.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.14.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.14.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.15.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.15.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.16.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.16.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.17.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.17.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.18.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.18.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.19.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.19.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.20.gate_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.20.up_proj.weight": "model-00111-of-00132.safetensors", + "model.layers.79.mlp.experts.21.gate_proj.weight": 
"model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.21.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.22.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.22.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.23.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.23.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.24.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.24.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.25.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.25.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.26.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.26.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.27.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.27.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.28.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.28.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.29.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.29.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.30.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.30.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.31.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.31.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.32.gate_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.32.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.33.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.33.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.34.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.34.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.35.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.35.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.36.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.36.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.37.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.37.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.38.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.38.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.39.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.39.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.40.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.40.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.41.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.41.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.42.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.42.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.43.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.43.up_proj.weight": 
"model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.44.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.44.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.45.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.45.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.46.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.46.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.47.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.47.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.48.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.48.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.49.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.49.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.50.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.50.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.51.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.51.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.52.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.52.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.53.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.53.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.54.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.54.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.55.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.55.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.56.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.56.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.57.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.57.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.58.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.58.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.59.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.59.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.60.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.60.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.61.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.61.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.62.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.62.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.63.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.63.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.64.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.64.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.65.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.65.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.66.gate_proj.weight": 
"model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.66.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.67.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.67.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.68.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.68.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.69.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.69.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.70.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.70.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.71.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.71.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.72.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.72.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.73.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.73.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.74.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.74.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.75.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.75.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.76.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.76.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.77.gate_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.77.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.78.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.78.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.79.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.79.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.80.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.80.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.81.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.81.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.82.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.82.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.83.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.83.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.84.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.84.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.85.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.85.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.86.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.86.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.87.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.87.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.88.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.88.up_proj.weight": 
"model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.89.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.89.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.90.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.90.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.91.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.91.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.92.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.92.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.93.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.93.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.94.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.94.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.95.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.95.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.96.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.96.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.97.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.97.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.98.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.98.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.99.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.99.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.100.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.100.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.101.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.101.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.102.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.102.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.103.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.103.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.104.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.104.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.105.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.105.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.106.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.106.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.107.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.107.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.108.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.108.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.109.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.109.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.110.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.110.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.111.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.111.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.112.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.112.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.113.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.113.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.114.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.114.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.115.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.115.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.116.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.116.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.117.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.117.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.118.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.118.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.119.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.119.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.120.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.120.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.121.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.121.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.122.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.122.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.123.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.123.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.124.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.124.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.125.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.125.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.126.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.126.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.127.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.127.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.128.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.128.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.129.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.129.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.130.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.130.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.131.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.131.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.132.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.132.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.133.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.133.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.134.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.134.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.135.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.135.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.136.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.136.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.137.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.137.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.138.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.138.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.139.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.139.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.140.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.140.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.141.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.141.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.142.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.142.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.143.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.143.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.144.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.144.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.145.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.145.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.146.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.146.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.147.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.147.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.148.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.148.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.149.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.149.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.150.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.150.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.151.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.151.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.152.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.152.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.153.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.153.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.154.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.154.up_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.155.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.155.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.156.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.156.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.157.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.157.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.158.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.158.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.159.gate_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.159.up_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.0.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.1.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.2.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.3.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.4.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.5.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.6.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.7.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.8.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.9.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.10.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.11.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.12.down_proj.weight": 
"model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.13.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.14.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.15.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.16.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.17.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.18.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.19.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.20.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.21.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.22.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.23.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.24.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.25.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.26.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.27.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.28.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.29.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.30.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.31.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.32.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.33.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.34.down_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.35.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.36.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.37.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.38.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.39.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.40.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.41.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.42.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.43.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.44.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.45.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.46.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.47.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.48.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.49.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.50.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.51.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.52.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.53.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.54.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.55.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.56.down_proj.weight": "model-00112-of-00132.safetensors", + 
"model.layers.79.mlp.experts.57.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.58.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.59.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.60.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.61.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.62.down_proj.weight": "model-00112-of-00132.safetensors", + "model.layers.79.mlp.experts.63.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.64.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.65.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.66.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.67.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.68.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.69.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.70.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.71.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.72.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.73.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.74.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.75.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.76.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.77.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.78.down_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.79.mlp.experts.79.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.80.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.81.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.82.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.83.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.84.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.85.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.86.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.87.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.88.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.89.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.90.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.91.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.92.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.93.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.94.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.95.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.96.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.97.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.98.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.99.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.100.down_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.79.mlp.experts.101.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.102.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.103.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.104.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.105.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.106.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.107.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.108.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.109.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.110.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.111.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.112.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.113.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.114.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.115.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.116.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.117.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.118.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.119.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.120.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.121.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.122.down_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.79.mlp.experts.123.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.124.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.125.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.126.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.127.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.128.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.129.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.130.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.131.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.132.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.133.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.134.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.135.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.136.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.137.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.138.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.139.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.140.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.141.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.142.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.143.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.144.down_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.79.mlp.experts.145.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.146.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.147.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.148.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.149.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.150.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.151.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.152.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.153.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.154.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.155.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.156.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.157.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.158.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.experts.159.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.shared_experts.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.shared_experts.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.79.mlp.shared_experts.down_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.q_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.k_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.v_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.q_proj.bias": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.k_proj.bias": 
"model-00113-of-00132.safetensors", + "model.layers.80.self_attn.v_proj.bias": "model-00113-of-00132.safetensors", + "model.layers.80.self_attn.q_norm.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.0.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.0.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.1.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.1.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.2.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.2.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.3.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.3.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.4.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.4.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.5.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.5.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.6.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.6.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.7.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.7.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.8.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.8.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.9.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.9.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.10.gate_proj.weight": 
"model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.10.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.11.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.11.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.12.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.12.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.13.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.13.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.14.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.14.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.15.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.15.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.16.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.16.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.17.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.17.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.18.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.18.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.19.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.19.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.20.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.20.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.21.gate_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.80.mlp.experts.21.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.22.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.22.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.23.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.23.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.24.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.24.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.25.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.25.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.26.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.26.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.27.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.27.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.28.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.28.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.29.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.29.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.30.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.30.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.31.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.31.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.32.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.32.up_proj.weight": 
"model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.33.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.33.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.34.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.34.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.35.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.35.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.36.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.36.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.37.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.37.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.38.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.38.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.39.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.39.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.40.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.40.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.41.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.41.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.42.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.42.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.43.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.43.up_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.80.mlp.experts.44.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.44.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.45.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.45.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.46.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.46.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.47.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.47.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.48.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.48.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.49.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.49.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.50.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.50.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.51.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.51.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.52.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.52.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.53.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.53.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.54.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.54.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.55.gate_proj.weight": 
"model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.55.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.56.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.56.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.57.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.57.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.58.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.58.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.59.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.59.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.60.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.60.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.61.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.61.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.62.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.62.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.63.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.63.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.64.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.64.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.65.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.65.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.66.gate_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.80.mlp.experts.66.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.67.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.67.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.68.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.68.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.69.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.69.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.70.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.70.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.71.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.71.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.72.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.72.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.73.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.73.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.74.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.74.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.75.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.75.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.76.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.76.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.77.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.77.up_proj.weight": 
"model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.78.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.78.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.79.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.79.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.80.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.80.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.81.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.81.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.82.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.82.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.83.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.83.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.84.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.84.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.85.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.85.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.86.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.86.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.87.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.87.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.88.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.88.up_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.80.mlp.experts.89.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.89.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.90.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.90.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.91.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.91.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.92.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.92.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.93.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.93.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.94.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.94.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.95.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.95.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.96.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.96.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.97.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.97.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.98.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.98.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.99.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.99.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.100.gate_proj.weight": 
"model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.100.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.101.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.101.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.102.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.102.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.103.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.103.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.104.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.104.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.105.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.105.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.106.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.106.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.107.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.107.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.108.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.108.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.109.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.109.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.110.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.110.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.111.gate_proj.weight": "model-00113-of-00132.safetensors", + 
"model.layers.80.mlp.experts.111.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.112.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.112.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.113.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.113.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.114.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.114.up_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.115.gate_proj.weight": "model-00113-of-00132.safetensors", + "model.layers.80.mlp.experts.115.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.116.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.116.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.117.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.117.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.118.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.118.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.119.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.119.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.120.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.120.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.121.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.121.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.122.gate_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.122.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.123.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.123.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.124.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.124.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.125.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.125.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.126.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.126.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.127.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.127.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.128.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.128.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.129.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.129.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.130.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.130.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.131.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.131.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.132.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.132.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.133.gate_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.133.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.134.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.134.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.135.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.135.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.136.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.136.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.137.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.137.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.138.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.138.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.139.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.139.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.140.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.140.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.141.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.141.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.142.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.142.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.143.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.143.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.144.gate_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.144.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.145.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.145.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.146.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.146.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.147.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.147.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.148.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.148.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.149.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.149.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.150.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.150.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.151.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.151.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.152.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.152.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.153.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.153.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.154.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.154.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.155.gate_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.155.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.156.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.156.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.157.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.157.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.158.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.158.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.159.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.159.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.0.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.1.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.2.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.3.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.4.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.5.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.6.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.7.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.8.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.9.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.10.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.11.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.12.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.13.down_proj.weight": 
"model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.14.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.15.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.16.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.17.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.18.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.19.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.20.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.21.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.22.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.23.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.24.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.25.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.26.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.27.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.28.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.29.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.30.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.31.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.32.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.33.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.34.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.35.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.36.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.37.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.38.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.39.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.40.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.41.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.42.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.43.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.44.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.45.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.46.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.47.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.48.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.49.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.50.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.51.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.52.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.53.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.54.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.55.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.56.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.57.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.58.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.59.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.60.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.61.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.62.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.63.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.64.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.65.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.66.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.67.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.68.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.69.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.70.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.71.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.72.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.73.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.74.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.75.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.76.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.77.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.78.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.79.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.80.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.81.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.82.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.83.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.84.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.85.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.86.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.87.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.88.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.89.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.90.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.91.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.92.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.93.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.94.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.95.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.96.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.97.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.98.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.99.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.100.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.101.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.102.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.103.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.104.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.105.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.106.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.107.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.108.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.109.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.110.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.111.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.112.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.113.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.114.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.115.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.116.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.117.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.118.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.119.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.120.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.121.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.122.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.123.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.124.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.125.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.126.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.127.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.128.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.129.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.130.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.131.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.132.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.133.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.134.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.135.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.136.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.137.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.138.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.139.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.140.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.141.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.142.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.143.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.144.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.145.down_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.80.mlp.experts.146.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.147.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.148.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.149.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.150.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.151.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.152.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.153.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.154.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.155.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.156.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.157.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.158.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.experts.159.down_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.shared_experts.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.80.mlp.shared_experts.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.self_attn.o_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.self_attn.q_norm.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.gate.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.gate.e_score_correction_bias": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.0.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.0.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.1.gate_proj.weight": 
"model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.1.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.2.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.2.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.3.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.3.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.4.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.4.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.5.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.5.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.6.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.6.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.7.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.7.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.8.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.8.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.9.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.9.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.10.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.10.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.11.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.11.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.12.gate_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.81.mlp.experts.12.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.13.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.13.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.14.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.14.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.15.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.15.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.16.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.16.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.17.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.17.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.18.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.18.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.19.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.19.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.20.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.20.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.21.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.21.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.22.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.22.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.23.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.23.up_proj.weight": 
"model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.24.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.24.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.25.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.25.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.26.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.26.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.27.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.27.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.28.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.28.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.29.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.29.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.30.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.30.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.31.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.31.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.32.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.32.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.33.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.33.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.34.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.34.up_proj.weight": "model-00114-of-00132.safetensors", + 
"model.layers.81.mlp.experts.35.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.35.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.36.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.36.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.37.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.37.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.38.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.38.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.39.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.39.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.40.gate_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.40.up_proj.weight": "model-00114-of-00132.safetensors", + "model.layers.81.mlp.experts.41.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.41.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.42.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.42.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.43.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.43.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.44.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.44.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.45.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.45.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.46.gate_proj.weight": 
"model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.46.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.47.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.47.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.48.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.48.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.49.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.49.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.50.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.50.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.51.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.51.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.52.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.52.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.53.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.53.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.54.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.54.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.55.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.55.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.56.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.56.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.57.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.57.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.58.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.58.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.59.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.59.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.60.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.60.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.61.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.61.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.62.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.62.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.63.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.63.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.64.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.64.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.65.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.65.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.66.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.66.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.67.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.67.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.68.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.68.up_proj.weight": 
"model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.69.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.69.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.70.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.70.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.71.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.71.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.72.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.72.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.73.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.73.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.74.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.74.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.75.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.75.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.76.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.76.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.77.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.77.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.78.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.78.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.79.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.79.up_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.80.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.80.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.81.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.81.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.82.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.82.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.83.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.83.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.84.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.84.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.85.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.85.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.86.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.86.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.87.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.87.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.88.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.88.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.89.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.89.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.90.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.90.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.91.gate_proj.weight": 
"model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.91.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.92.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.92.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.93.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.93.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.94.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.94.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.95.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.95.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.96.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.96.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.97.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.97.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.98.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.98.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.99.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.99.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.100.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.100.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.101.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.101.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.102.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.102.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.103.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.103.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.104.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.104.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.105.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.105.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.106.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.106.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.107.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.107.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.108.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.108.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.109.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.109.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.110.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.110.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.111.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.111.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.112.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.112.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.113.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.113.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.114.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.114.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.115.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.115.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.116.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.116.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.117.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.117.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.118.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.118.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.119.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.119.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.120.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.120.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.121.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.121.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.122.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.122.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.123.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.123.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.124.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.124.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.125.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.125.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.126.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.126.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.127.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.127.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.128.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.128.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.129.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.129.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.130.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.130.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.131.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.131.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.132.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.132.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.133.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.133.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.134.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.134.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.135.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.135.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.136.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.136.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.137.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.137.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.138.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.138.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.139.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.139.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.140.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.140.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.141.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.141.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.142.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.142.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.143.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.143.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.144.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.144.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.145.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.145.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.146.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.146.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.147.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.147.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.148.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.148.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.149.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.149.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.150.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.150.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.151.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.151.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.152.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.152.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.153.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.153.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.154.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.154.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.155.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.155.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.156.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.156.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.157.gate_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.157.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.158.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.158.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.159.gate_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.159.up_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.0.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.1.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.2.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.3.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.4.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.5.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.6.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.7.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.8.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.9.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.10.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.11.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.12.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.13.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.14.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.15.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.16.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.17.down_proj.weight": 
"model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.18.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.19.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.20.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.21.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.22.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.23.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.24.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.25.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.26.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.27.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.28.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.29.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.30.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.31.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.32.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.33.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.34.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.35.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.36.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.37.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.38.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.39.down_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.40.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.41.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.42.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.43.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.44.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.45.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.46.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.47.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.48.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.49.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.50.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.51.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.52.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.53.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.54.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.55.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.56.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.57.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.58.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.59.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.60.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.61.down_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.62.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.63.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.64.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.65.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.66.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.67.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.68.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.69.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.70.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.71.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.72.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.73.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.74.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.75.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.76.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.77.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.78.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.79.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.80.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.81.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.82.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.83.down_proj.weight": "model-00115-of-00132.safetensors", + 
"model.layers.81.mlp.experts.84.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.85.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.86.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.87.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.88.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.89.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.90.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.91.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.92.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.93.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.94.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.95.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.96.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.97.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.98.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.99.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.100.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.101.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.102.down_proj.weight": "model-00115-of-00132.safetensors", + "model.layers.81.mlp.experts.103.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.104.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.105.down_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.81.mlp.experts.106.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.107.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.108.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.109.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.110.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.111.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.112.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.113.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.114.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.115.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.116.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.117.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.118.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.119.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.120.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.121.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.122.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.123.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.124.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.125.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.126.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.127.down_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.81.mlp.experts.128.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.129.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.130.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.131.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.132.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.133.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.134.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.135.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.136.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.137.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.138.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.139.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.140.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.141.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.142.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.143.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.144.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.145.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.146.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.147.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.148.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.149.down_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.81.mlp.experts.150.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.151.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.152.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.153.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.154.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.155.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.156.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.157.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.158.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.experts.159.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.shared_experts.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.shared_experts.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.81.mlp.shared_experts.down_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.q_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.k_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.v_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.q_proj.bias": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.k_proj.bias": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.v_proj.bias": "model-00116-of-00132.safetensors", + "model.layers.82.self_attn.q_norm.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.0.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.0.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.1.gate_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.1.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.2.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.2.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.3.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.3.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.4.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.4.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.5.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.5.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.6.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.6.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.7.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.7.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.8.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.8.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.9.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.9.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.10.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.10.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.11.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.11.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.12.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.12.up_proj.weight": 
"model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.13.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.13.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.14.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.14.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.15.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.15.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.16.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.16.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.17.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.17.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.18.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.18.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.19.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.19.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.20.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.20.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.21.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.21.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.22.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.22.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.23.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.23.up_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.24.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.24.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.25.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.25.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.26.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.26.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.27.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.27.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.28.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.28.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.29.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.29.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.30.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.30.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.31.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.31.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.32.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.32.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.33.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.33.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.34.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.34.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.35.gate_proj.weight": 
"model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.35.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.36.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.36.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.37.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.37.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.38.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.38.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.39.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.39.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.40.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.40.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.41.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.41.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.42.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.42.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.43.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.43.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.44.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.44.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.45.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.45.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.46.gate_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.46.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.47.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.47.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.48.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.48.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.49.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.49.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.50.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.50.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.51.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.51.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.52.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.52.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.53.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.53.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.54.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.54.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.55.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.55.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.56.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.56.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.57.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.57.up_proj.weight": 
"model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.58.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.58.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.59.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.59.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.60.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.60.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.61.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.61.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.62.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.62.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.63.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.63.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.64.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.64.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.65.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.65.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.66.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.66.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.67.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.67.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.68.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.68.up_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.69.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.69.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.70.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.70.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.71.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.71.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.72.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.72.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.73.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.73.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.74.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.74.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.75.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.75.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.76.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.76.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.77.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.77.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.78.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.78.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.79.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.79.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.80.gate_proj.weight": 
"model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.80.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.81.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.81.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.82.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.82.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.83.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.83.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.84.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.84.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.85.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.85.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.86.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.86.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.87.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.87.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.88.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.88.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.89.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.89.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.90.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.90.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.91.gate_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.91.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.92.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.92.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.93.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.93.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.94.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.94.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.95.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.95.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.96.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.96.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.97.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.97.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.98.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.98.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.99.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.99.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.100.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.100.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.101.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.101.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.102.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.102.up_proj.weight": 
"model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.103.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.103.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.104.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.104.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.105.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.105.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.106.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.106.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.107.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.107.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.108.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.108.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.109.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.109.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.110.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.110.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.111.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.111.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.112.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.112.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.113.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.113.up_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.114.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.114.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.115.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.115.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.116.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.116.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.117.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.117.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.118.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.118.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.119.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.119.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.120.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.120.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.121.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.121.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.122.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.122.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.123.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.123.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.124.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.124.up_proj.weight": "model-00116-of-00132.safetensors", + 
"model.layers.82.mlp.experts.125.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.125.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.126.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.126.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.127.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.127.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.128.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.128.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.129.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.129.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.130.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.130.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.131.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.131.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.132.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.132.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.133.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.133.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.134.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.134.up_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.135.gate_proj.weight": "model-00116-of-00132.safetensors", + "model.layers.82.mlp.experts.135.up_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.136.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.136.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.137.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.137.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.138.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.138.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.139.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.139.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.140.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.140.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.141.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.141.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.142.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.142.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.143.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.143.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.144.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.144.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.145.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.145.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.146.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.146.up_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.147.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.147.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.148.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.148.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.149.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.149.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.150.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.150.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.151.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.151.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.152.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.152.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.153.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.153.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.154.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.154.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.155.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.155.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.156.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.156.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.157.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.157.up_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.158.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.158.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.159.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.159.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.0.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.1.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.2.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.3.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.4.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.5.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.6.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.7.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.8.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.9.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.10.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.11.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.12.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.13.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.14.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.15.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.16.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.17.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.18.down_proj.weight": 
"model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.19.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.20.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.21.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.22.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.23.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.24.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.25.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.26.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.27.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.28.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.29.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.30.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.31.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.32.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.33.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.34.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.35.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.36.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.37.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.38.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.39.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.40.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.41.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.42.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.43.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.44.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.45.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.46.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.47.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.48.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.49.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.50.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.51.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.52.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.53.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.54.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.55.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.56.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.57.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.58.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.59.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.60.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.61.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.62.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.63.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.64.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.65.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.66.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.67.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.68.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.69.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.70.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.71.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.72.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.73.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.74.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.75.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.76.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.77.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.78.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.79.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.80.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.81.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.82.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.83.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.84.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.85.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.86.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.87.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.88.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.89.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.90.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.91.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.92.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.93.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.94.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.95.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.96.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.97.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.98.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.99.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.100.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.101.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.102.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.103.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.104.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.105.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.106.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.107.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.108.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.109.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.110.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.111.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.112.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.113.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.114.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.115.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.116.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.117.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.118.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.119.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.120.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.121.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.122.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.123.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.124.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.125.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.126.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.127.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.128.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.129.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.130.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.131.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.132.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.133.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.134.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.135.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.136.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.137.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.138.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.139.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.140.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.141.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.142.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.143.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.144.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.145.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.146.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.147.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.148.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.149.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.150.down_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.82.mlp.experts.151.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.152.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.153.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.154.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.155.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.156.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.157.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.158.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.experts.159.down_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.shared_experts.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.82.mlp.shared_experts.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.self_attn.o_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.self_attn.q_norm.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.gate.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.gate.e_score_correction_bias": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.0.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.0.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.1.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.1.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.2.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.2.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.3.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.3.up_proj.weight": 
"model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.4.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.4.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.5.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.5.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.6.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.6.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.7.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.7.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.8.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.8.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.9.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.9.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.10.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.10.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.11.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.11.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.12.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.12.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.13.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.13.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.14.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.14.up_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.83.mlp.experts.15.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.15.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.16.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.16.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.17.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.17.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.18.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.18.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.19.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.19.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.20.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.20.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.21.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.21.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.22.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.22.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.23.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.23.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.24.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.24.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.25.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.25.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.26.gate_proj.weight": 
"model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.26.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.27.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.27.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.28.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.28.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.29.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.29.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.30.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.30.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.31.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.31.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.32.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.32.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.33.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.33.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.34.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.34.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.35.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.35.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.36.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.36.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.37.gate_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.83.mlp.experts.37.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.38.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.38.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.39.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.39.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.40.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.40.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.41.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.41.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.42.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.42.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.43.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.43.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.44.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.44.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.45.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.45.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.46.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.46.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.47.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.47.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.48.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.48.up_proj.weight": 
"model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.49.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.49.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.50.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.50.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.51.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.51.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.52.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.52.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.53.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.53.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.54.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.54.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.55.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.55.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.56.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.56.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.57.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.57.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.58.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.58.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.59.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.59.up_proj.weight": "model-00117-of-00132.safetensors", + 
"model.layers.83.mlp.experts.60.gate_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.60.up_proj.weight": "model-00117-of-00132.safetensors", + "model.layers.83.mlp.experts.61.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.61.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.62.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.62.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.63.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.63.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.64.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.64.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.65.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.65.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.66.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.66.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.67.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.67.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.68.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.68.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.69.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.69.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.70.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.70.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.71.gate_proj.weight": 
"model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.71.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.72.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.72.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.73.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.73.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.74.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.74.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.75.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.75.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.76.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.76.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.77.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.77.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.78.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.78.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.79.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.79.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.80.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.80.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.81.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.81.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.82.gate_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.82.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.83.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.83.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.84.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.84.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.85.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.85.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.86.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.86.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.87.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.87.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.88.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.88.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.89.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.89.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.90.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.90.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.91.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.91.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.92.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.92.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.93.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.93.up_proj.weight": 
"model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.94.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.94.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.95.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.95.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.96.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.96.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.97.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.97.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.98.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.98.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.99.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.99.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.100.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.100.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.101.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.101.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.102.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.102.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.103.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.103.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.104.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.104.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.105.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.105.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.106.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.106.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.107.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.107.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.108.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.108.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.109.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.109.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.110.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.110.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.111.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.111.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.112.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.112.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.113.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.113.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.114.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.114.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.115.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.115.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.116.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.116.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.117.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.117.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.118.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.118.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.119.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.119.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.120.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.120.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.121.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.121.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.122.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.122.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.123.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.123.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.124.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.124.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.125.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.125.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.126.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.126.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.127.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.127.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.128.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.128.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.129.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.129.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.130.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.130.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.131.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.131.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.132.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.132.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.133.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.133.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.134.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.134.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.135.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.135.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.136.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.136.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.137.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.137.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.138.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.138.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.139.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.139.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.140.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.140.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.141.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.141.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.142.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.142.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.143.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.143.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.144.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.144.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.145.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.145.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.146.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.146.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.147.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.147.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.148.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.148.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.149.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.149.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.150.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.150.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.151.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.151.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.152.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.152.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.153.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.153.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.154.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.154.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.155.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.155.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.156.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.156.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.157.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.157.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.158.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.158.up_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.159.gate_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.159.up_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.0.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.1.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.2.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.3.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.4.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.5.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.6.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.7.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.8.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.9.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.10.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.11.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.12.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.13.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.14.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.15.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.16.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.17.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.18.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.19.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.20.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.21.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.22.down_proj.weight": 
"model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.23.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.24.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.25.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.26.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.27.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.28.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.29.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.30.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.31.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.32.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.33.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.34.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.35.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.36.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.37.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.38.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.39.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.40.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.41.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.42.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.43.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.44.down_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.45.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.46.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.47.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.48.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.49.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.50.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.51.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.52.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.53.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.54.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.55.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.56.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.57.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.58.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.59.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.60.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.61.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.62.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.63.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.64.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.65.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.66.down_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.67.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.68.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.69.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.70.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.71.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.72.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.73.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.74.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.75.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.76.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.77.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.78.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.79.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.80.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.81.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.82.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.83.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.84.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.85.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.86.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.87.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.88.down_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.89.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.90.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.91.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.92.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.93.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.94.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.95.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.96.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.97.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.98.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.99.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.100.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.101.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.102.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.103.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.104.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.105.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.106.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.107.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.108.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.109.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.110.down_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.111.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.112.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.113.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.114.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.115.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.116.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.117.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.118.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.119.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.120.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.121.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.122.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.123.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.124.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.125.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.126.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.127.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.128.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.129.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.130.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.131.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.132.down_proj.weight": "model-00118-of-00132.safetensors", + 
"model.layers.83.mlp.experts.133.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.134.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.135.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.136.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.137.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.138.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.139.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.140.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.141.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.142.down_proj.weight": "model-00118-of-00132.safetensors", + "model.layers.83.mlp.experts.143.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.144.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.145.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.146.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.147.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.148.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.149.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.150.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.151.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.152.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.153.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.154.down_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.83.mlp.experts.155.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.156.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.157.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.158.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.experts.159.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.shared_experts.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.shared_experts.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.83.mlp.shared_experts.down_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.input_layernorm.weight": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.q_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.k_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.v_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.q_proj.bias": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.k_proj.bias": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.v_proj.bias": "model-00119-of-00132.safetensors", + "model.layers.84.self_attn.q_norm.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.0.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.0.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.1.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.1.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.2.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.2.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.3.gate_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.3.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.4.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.4.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.5.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.5.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.6.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.6.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.7.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.7.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.8.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.8.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.9.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.9.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.10.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.10.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.11.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.11.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.12.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.12.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.13.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.13.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.14.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.14.up_proj.weight": 
"model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.15.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.15.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.16.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.16.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.17.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.17.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.18.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.18.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.19.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.19.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.20.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.20.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.21.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.21.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.22.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.22.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.23.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.23.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.24.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.24.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.25.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.25.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.26.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.26.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.27.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.27.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.28.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.28.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.29.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.29.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.30.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.30.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.31.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.31.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.32.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.32.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.33.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.33.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.34.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.34.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.35.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.35.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.36.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.36.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.37.gate_proj.weight": 
"model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.37.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.38.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.38.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.39.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.39.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.40.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.40.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.41.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.41.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.42.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.42.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.43.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.43.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.44.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.44.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.45.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.45.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.46.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.46.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.47.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.47.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.48.gate_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.48.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.49.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.49.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.50.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.50.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.51.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.51.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.52.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.52.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.53.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.53.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.54.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.54.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.55.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.55.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.56.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.56.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.57.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.57.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.58.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.58.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.59.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.59.up_proj.weight": 
"model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.60.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.60.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.61.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.61.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.62.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.62.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.63.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.63.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.64.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.64.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.65.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.65.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.66.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.66.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.67.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.67.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.68.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.68.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.69.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.69.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.70.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.70.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.71.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.71.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.72.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.72.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.73.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.73.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.74.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.74.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.75.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.75.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.76.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.76.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.77.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.77.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.78.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.78.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.79.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.79.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.80.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.80.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.81.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.81.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.82.gate_proj.weight": 
"model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.82.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.83.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.83.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.84.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.84.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.85.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.85.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.86.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.86.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.87.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.87.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.88.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.88.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.89.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.89.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.90.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.90.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.91.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.91.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.92.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.92.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.93.gate_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.93.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.94.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.94.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.95.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.95.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.96.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.96.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.97.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.97.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.98.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.98.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.99.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.99.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.100.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.100.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.101.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.101.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.102.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.102.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.103.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.103.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.104.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.104.up_proj.weight": 
"model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.105.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.105.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.106.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.106.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.107.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.107.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.108.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.108.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.109.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.109.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.110.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.110.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.111.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.111.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.112.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.112.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.113.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.113.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.114.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.114.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.115.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.115.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.116.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.116.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.117.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.117.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.118.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.118.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.119.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.119.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.120.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.120.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.121.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.121.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.122.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.122.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.123.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.123.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.124.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.124.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.125.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.125.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.126.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.126.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.127.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.127.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.128.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.128.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.129.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.129.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.130.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.130.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.131.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.131.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.132.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.132.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.133.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.133.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.134.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.134.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.135.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.135.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.136.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.136.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.137.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.137.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.138.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.138.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.139.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.139.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.140.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.140.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.141.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.141.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.142.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.142.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.143.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.143.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.144.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.144.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.145.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.145.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.146.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.146.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.147.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.147.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.148.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.148.up_proj.weight": "model-00119-of-00132.safetensors", + 
"model.layers.84.mlp.experts.149.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.149.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.150.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.150.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.151.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.151.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.152.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.152.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.153.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.153.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.154.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.154.up_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.155.gate_proj.weight": "model-00119-of-00132.safetensors", + "model.layers.84.mlp.experts.155.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.156.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.156.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.157.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.157.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.158.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.158.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.159.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.159.up_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.0.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.1.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.2.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.3.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.4.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.5.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.6.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.7.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.8.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.9.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.10.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.11.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.12.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.13.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.14.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.15.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.16.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.17.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.18.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.19.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.20.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.21.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.22.down_proj.weight": 
"model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.23.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.24.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.25.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.26.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.27.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.28.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.29.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.30.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.31.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.32.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.33.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.34.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.35.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.36.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.37.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.38.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.39.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.40.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.41.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.42.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.43.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.44.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.45.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.46.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.47.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.48.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.49.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.50.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.51.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.52.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.53.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.54.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.55.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.56.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.57.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.58.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.59.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.60.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.61.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.62.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.63.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.64.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.65.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.66.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.67.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.68.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.69.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.70.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.71.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.72.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.73.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.74.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.75.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.76.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.77.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.78.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.79.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.80.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.81.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.82.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.83.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.84.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.85.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.86.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.87.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.88.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.89.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.90.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.91.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.92.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.93.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.94.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.95.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.96.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.97.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.98.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.99.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.100.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.101.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.102.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.103.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.104.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.105.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.106.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.107.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.108.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.109.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.110.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.111.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.112.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.113.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.114.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.115.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.116.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.117.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.118.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.119.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.120.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.121.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.122.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.123.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.124.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.125.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.126.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.127.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.128.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.129.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.130.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.131.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.132.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.133.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.134.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.135.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.136.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.137.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.138.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.139.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.140.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.141.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.142.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.143.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.144.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.145.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.146.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.147.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.148.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.149.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.150.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.151.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.152.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.153.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.154.down_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.84.mlp.experts.155.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.156.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.157.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.158.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.experts.159.down_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.shared_experts.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.84.mlp.shared_experts.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.self_attn.o_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.input_layernorm.weight": "model-00120-of-00132.safetensors", + "model.layers.85.self_attn.q_norm.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.gate.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.gate.e_score_correction_bias": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.0.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.0.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.1.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.1.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.2.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.2.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.3.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.3.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.4.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.4.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.5.gate_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.85.mlp.experts.5.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.6.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.6.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.7.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.7.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.8.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.8.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.9.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.9.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.10.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.10.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.11.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.11.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.12.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.12.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.13.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.13.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.14.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.14.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.15.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.15.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.16.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.16.up_proj.weight": 
"model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.17.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.17.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.18.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.18.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.19.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.19.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.20.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.20.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.21.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.21.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.22.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.22.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.23.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.23.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.24.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.24.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.25.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.25.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.26.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.26.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.27.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.27.up_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.85.mlp.experts.28.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.28.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.29.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.29.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.30.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.30.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.31.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.31.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.32.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.32.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.33.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.33.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.34.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.34.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.35.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.35.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.36.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.36.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.37.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.37.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.38.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.38.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.39.gate_proj.weight": 
"model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.39.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.40.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.40.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.41.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.41.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.42.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.42.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.43.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.43.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.44.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.44.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.45.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.45.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.46.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.46.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.47.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.47.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.48.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.48.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.49.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.49.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.50.gate_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.85.mlp.experts.50.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.51.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.51.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.52.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.52.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.53.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.53.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.54.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.54.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.55.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.55.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.56.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.56.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.57.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.57.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.58.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.58.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.59.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.59.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.60.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.60.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.61.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.61.up_proj.weight": 
"model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.62.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.62.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.63.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.63.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.64.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.64.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.65.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.65.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.66.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.66.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.67.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.67.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.68.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.68.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.69.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.69.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.70.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.70.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.71.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.71.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.72.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.72.up_proj.weight": "model-00120-of-00132.safetensors", + 
"model.layers.85.mlp.experts.73.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.73.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.74.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.74.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.75.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.75.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.76.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.76.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.77.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.77.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.78.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.78.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.79.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.79.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.80.gate_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.80.up_proj.weight": "model-00120-of-00132.safetensors", + "model.layers.85.mlp.experts.81.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.81.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.82.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.82.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.83.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.83.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.84.gate_proj.weight": 
"model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.84.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.85.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.85.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.86.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.86.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.87.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.87.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.88.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.88.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.89.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.89.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.90.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.90.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.91.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.91.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.92.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.92.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.93.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.93.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.94.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.94.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.95.gate_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.95.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.96.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.96.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.97.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.97.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.98.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.98.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.99.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.99.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.100.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.100.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.101.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.101.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.102.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.102.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.103.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.103.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.104.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.104.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.105.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.105.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.106.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.106.up_proj.weight": 
"model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.107.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.107.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.108.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.108.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.109.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.109.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.110.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.110.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.111.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.111.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.112.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.112.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.113.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.113.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.114.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.114.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.115.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.115.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.116.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.116.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.117.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.117.up_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.118.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.118.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.119.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.119.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.120.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.120.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.121.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.121.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.122.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.122.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.123.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.123.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.124.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.124.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.125.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.125.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.126.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.126.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.127.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.127.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.128.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.128.up_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.129.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.129.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.130.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.130.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.131.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.131.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.132.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.132.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.133.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.133.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.134.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.134.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.135.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.135.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.136.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.136.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.137.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.137.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.138.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.138.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.139.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.139.up_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.140.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.140.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.141.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.141.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.142.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.142.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.143.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.143.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.144.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.144.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.145.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.145.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.146.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.146.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.147.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.147.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.148.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.148.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.149.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.149.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.150.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.150.up_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.151.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.151.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.152.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.152.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.153.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.153.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.154.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.154.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.155.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.155.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.156.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.156.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.157.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.157.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.158.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.158.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.159.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.159.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.0.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.1.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.2.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.3.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.4.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.5.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.6.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.7.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.8.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.9.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.10.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.11.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.12.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.13.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.14.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.15.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.16.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.17.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.18.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.19.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.20.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.21.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.22.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.23.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.24.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.25.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.26.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.27.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.28.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.29.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.30.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.31.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.32.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.33.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.34.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.35.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.36.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.37.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.38.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.39.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.40.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.41.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.42.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.43.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.44.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.45.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.46.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.47.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.48.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.49.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.50.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.51.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.52.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.53.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.54.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.55.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.56.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.57.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.58.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.59.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.60.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.61.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.62.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.63.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.64.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.65.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.66.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.67.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.68.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.69.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.70.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.71.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.72.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.73.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.74.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.75.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.76.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.77.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.78.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.79.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.80.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.81.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.82.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.83.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.84.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.85.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.86.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.87.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.88.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.89.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.90.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.91.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.92.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.93.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.94.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.95.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.96.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.97.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.98.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.99.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.100.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.101.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.102.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.103.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.104.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.105.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.106.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.107.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.108.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.109.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.110.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.111.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.112.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.113.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.114.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.115.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.116.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.117.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.118.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.119.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.120.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.121.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.122.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.123.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.124.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.125.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.126.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.127.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.128.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.129.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.130.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.131.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.132.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.133.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.134.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.135.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.136.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.137.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.138.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.139.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.140.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.141.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.142.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.143.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.144.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.145.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.146.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.147.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.148.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.149.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.150.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.151.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.152.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.153.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.154.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.155.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.156.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.157.down_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.85.mlp.experts.158.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.experts.159.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.shared_experts.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.shared_experts.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.85.mlp.shared_experts.down_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.input_layernorm.weight": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.q_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.k_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.v_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.q_proj.bias": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.k_proj.bias": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.v_proj.bias": "model-00121-of-00132.safetensors", + "model.layers.86.self_attn.q_norm.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.0.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.0.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.1.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.1.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.2.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.2.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.3.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.3.up_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.4.gate_proj.weight": "model-00121-of-00132.safetensors", + "model.layers.86.mlp.experts.4.up_proj.weight": "model-00121-of-00132.safetensors", + 
"model.layers.86.mlp.experts.5.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.5.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.6.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.6.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.7.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.7.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.8.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.8.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.9.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.9.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.10.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.10.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.11.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.11.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.12.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.12.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.13.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.13.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.14.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.14.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.15.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.15.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.16.gate_proj.weight": 
"model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.16.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.17.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.17.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.18.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.18.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.19.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.19.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.20.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.20.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.21.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.21.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.22.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.22.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.23.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.23.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.24.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.24.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.25.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.25.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.26.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.26.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.27.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.27.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.28.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.28.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.29.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.29.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.30.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.30.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.31.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.31.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.32.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.32.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.33.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.33.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.34.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.34.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.35.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.35.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.36.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.36.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.37.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.37.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.38.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.38.up_proj.weight": 
"model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.39.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.39.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.40.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.40.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.41.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.41.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.42.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.42.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.43.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.43.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.44.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.44.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.45.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.45.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.46.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.46.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.47.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.47.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.48.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.48.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.49.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.49.up_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.50.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.50.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.51.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.51.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.52.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.52.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.53.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.53.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.54.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.54.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.55.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.55.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.56.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.56.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.57.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.57.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.58.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.58.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.59.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.59.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.60.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.60.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.61.gate_proj.weight": 
"model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.61.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.62.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.62.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.63.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.63.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.64.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.64.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.65.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.65.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.66.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.66.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.67.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.67.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.68.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.68.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.69.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.69.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.70.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.70.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.71.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.71.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.72.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.72.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.73.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.73.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.74.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.74.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.75.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.75.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.76.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.76.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.77.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.77.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.78.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.78.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.79.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.79.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.80.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.80.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.81.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.81.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.82.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.82.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.83.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.83.up_proj.weight": 
"model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.84.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.84.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.85.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.85.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.86.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.86.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.87.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.87.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.88.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.88.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.89.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.89.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.90.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.90.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.91.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.91.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.92.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.92.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.93.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.93.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.94.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.94.up_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.95.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.95.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.96.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.96.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.97.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.97.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.98.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.98.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.99.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.99.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.100.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.100.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.101.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.101.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.102.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.102.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.103.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.103.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.104.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.104.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.105.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.105.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.106.gate_proj.weight": 
"model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.106.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.107.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.107.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.108.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.108.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.109.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.109.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.110.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.110.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.111.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.111.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.112.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.112.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.113.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.113.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.114.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.114.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.115.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.115.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.116.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.116.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.117.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.117.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.118.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.118.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.119.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.119.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.120.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.120.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.121.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.121.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.122.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.122.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.123.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.123.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.124.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.124.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.125.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.125.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.126.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.126.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.127.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.127.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.128.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.128.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.129.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.129.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.130.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.130.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.131.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.131.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.132.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.132.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.133.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.133.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.134.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.134.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.135.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.135.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.136.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.136.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.137.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.137.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.138.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.138.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.139.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.139.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.140.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.140.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.141.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.141.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.142.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.142.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.143.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.143.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.144.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.144.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.145.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.145.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.146.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.146.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.147.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.147.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.148.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.148.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.149.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.149.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.150.gate_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.150.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.151.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.151.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.152.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.152.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.153.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.153.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.154.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.154.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.155.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.155.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.156.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.156.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.157.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.157.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.158.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.158.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.159.gate_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.159.up_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.0.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.1.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.2.down_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.3.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.4.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.5.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.6.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.7.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.8.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.9.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.10.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.11.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.12.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.13.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.14.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.15.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.16.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.17.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.18.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.19.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.20.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.21.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.22.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.23.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.24.down_proj.weight": "model-00122-of-00132.safetensors", + 
"model.layers.86.mlp.experts.25.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.26.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.27.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.28.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.29.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.30.down_proj.weight": "model-00122-of-00132.safetensors", + "model.layers.86.mlp.experts.31.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.32.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.33.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.34.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.35.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.36.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.37.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.38.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.39.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.40.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.41.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.42.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.43.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.44.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.45.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.46.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.47.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.48.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.49.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.50.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.51.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.52.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.53.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.54.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.55.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.56.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.57.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.58.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.59.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.60.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.61.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.62.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.63.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.64.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.65.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.66.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.67.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.68.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.69.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.70.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.71.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.72.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.73.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.74.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.75.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.76.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.77.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.78.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.79.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.80.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.81.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.82.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.83.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.84.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.85.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.86.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.87.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.88.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.89.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.90.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.91.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.92.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.93.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.94.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.95.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.96.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.97.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.98.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.99.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.100.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.101.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.102.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.103.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.104.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.105.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.106.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.107.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.108.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.109.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.110.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.111.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.112.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.113.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.114.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.115.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.116.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.117.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.118.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.119.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.120.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.121.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.122.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.123.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.124.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.125.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.126.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.127.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.128.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.129.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.130.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.131.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.132.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.133.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.134.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.135.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.136.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.137.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.138.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.139.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.140.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.141.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.142.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.143.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.144.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.145.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.146.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.147.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.148.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.149.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.150.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.151.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.152.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.153.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.154.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.155.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.156.down_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.86.mlp.experts.157.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.158.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.experts.159.down_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.shared_experts.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.86.mlp.shared_experts.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.self_attn.o_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.input_layernorm.weight": "model-00123-of-00132.safetensors", + "model.layers.87.self_attn.q_norm.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.gate.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.gate.e_score_correction_bias": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.0.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.0.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.1.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.1.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.2.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.2.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.3.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.3.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.4.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.4.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.5.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.5.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.6.gate_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.87.mlp.experts.6.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.7.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.7.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.8.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.8.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.9.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.9.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.10.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.10.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.11.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.11.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.12.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.12.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.13.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.13.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.14.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.14.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.15.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.15.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.16.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.16.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.17.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.17.up_proj.weight": 
"model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.18.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.18.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.19.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.19.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.20.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.20.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.21.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.21.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.22.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.22.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.23.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.23.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.24.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.24.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.25.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.25.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.26.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.26.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.27.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.27.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.28.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.28.up_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.87.mlp.experts.29.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.29.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.30.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.30.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.31.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.31.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.32.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.32.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.33.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.33.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.34.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.34.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.35.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.35.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.36.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.36.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.37.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.37.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.38.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.38.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.39.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.39.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.40.gate_proj.weight": 
"model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.40.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.41.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.41.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.42.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.42.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.43.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.43.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.44.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.44.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.45.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.45.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.46.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.46.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.47.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.47.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.48.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.48.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.49.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.49.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.50.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.50.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.51.gate_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.87.mlp.experts.51.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.52.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.52.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.53.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.53.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.54.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.54.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.55.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.55.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.56.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.56.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.57.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.57.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.58.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.58.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.59.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.59.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.60.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.60.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.61.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.61.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.62.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.62.up_proj.weight": 
"model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.63.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.63.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.64.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.64.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.65.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.65.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.66.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.66.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.67.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.67.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.68.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.68.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.69.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.69.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.70.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.70.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.71.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.71.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.72.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.72.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.73.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.73.up_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.87.mlp.experts.74.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.74.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.75.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.75.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.76.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.76.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.77.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.77.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.78.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.78.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.79.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.79.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.80.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.80.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.81.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.81.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.82.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.82.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.83.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.83.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.84.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.84.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.85.gate_proj.weight": 
"model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.85.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.86.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.86.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.87.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.87.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.88.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.88.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.89.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.89.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.90.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.90.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.91.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.91.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.92.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.92.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.93.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.93.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.94.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.94.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.95.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.95.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.96.gate_proj.weight": "model-00123-of-00132.safetensors", + 
"model.layers.87.mlp.experts.96.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.97.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.97.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.98.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.98.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.99.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.99.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.100.gate_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.100.up_proj.weight": "model-00123-of-00132.safetensors", + "model.layers.87.mlp.experts.101.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.101.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.102.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.102.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.103.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.103.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.104.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.104.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.105.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.105.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.106.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.106.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.107.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.107.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.108.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.108.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.109.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.109.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.110.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.110.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.111.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.111.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.112.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.112.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.113.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.113.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.114.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.114.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.115.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.115.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.116.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.116.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.117.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.117.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.118.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.118.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.119.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.119.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.120.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.120.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.121.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.121.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.122.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.122.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.123.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.123.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.124.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.124.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.125.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.125.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.126.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.126.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.127.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.127.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.128.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.128.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.129.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.129.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.130.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.130.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.131.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.131.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.132.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.132.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.133.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.133.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.134.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.134.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.135.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.135.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.136.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.136.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.137.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.137.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.138.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.138.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.139.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.139.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.140.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.140.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.141.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.141.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.142.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.142.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.143.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.143.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.144.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.144.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.145.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.145.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.146.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.146.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.147.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.147.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.148.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.148.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.149.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.149.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.150.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.150.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.151.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.151.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.152.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.152.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.153.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.153.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.154.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.154.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.155.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.155.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.156.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.156.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.157.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.157.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.158.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.158.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.159.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.159.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.0.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.1.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.2.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.3.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.4.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.5.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.6.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.7.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.8.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.9.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.10.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.11.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.12.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.13.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.14.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.15.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.16.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.17.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.18.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.19.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.20.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.21.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.22.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.23.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.24.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.25.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.26.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.27.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.28.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.29.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.30.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.31.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.32.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.33.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.34.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.35.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.36.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.37.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.38.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.39.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.40.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.41.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.42.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.43.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.44.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.45.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.46.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.47.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.48.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.49.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.50.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.51.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.52.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.53.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.54.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.55.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.56.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.57.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.58.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.59.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.60.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.61.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.62.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.63.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.64.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.65.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.66.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.67.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.68.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.69.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.70.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.71.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.72.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.73.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.74.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.75.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.76.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.77.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.78.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.79.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.80.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.81.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.82.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.83.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.84.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.85.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.86.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.87.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.88.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.89.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.90.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.91.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.92.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.93.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.94.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.95.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.96.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.97.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.98.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.99.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.100.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.101.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.102.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.103.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.104.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.105.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.106.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.107.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.108.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.109.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.110.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.111.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.112.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.113.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.114.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.115.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.116.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.117.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.118.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.119.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.120.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.121.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.122.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.123.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.124.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.125.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.126.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.127.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.128.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.129.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.130.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.131.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.132.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.133.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.134.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.135.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.136.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.137.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.138.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.139.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.140.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.141.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.142.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.143.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.144.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.145.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.146.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.147.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.148.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.149.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.150.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.151.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.152.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.153.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.154.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.155.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.156.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.157.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.experts.158.down_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.87.mlp.experts.159.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.shared_experts.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.shared_experts.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.87.mlp.shared_experts.down_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.input_layernorm.weight": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.q_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.k_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.v_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.q_proj.bias": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.k_proj.bias": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.v_proj.bias": "model-00124-of-00132.safetensors", + "model.layers.88.self_attn.q_norm.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.0.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.0.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.1.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.1.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.2.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.2.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.3.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.3.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.4.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.4.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.5.gate_proj.weight": "model-00124-of-00132.safetensors", + 
"model.layers.88.mlp.experts.5.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.6.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.6.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.7.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.7.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.8.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.8.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.9.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.9.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.10.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.10.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.11.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.11.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.12.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.12.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.13.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.13.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.14.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.14.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.15.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.15.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.16.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.16.up_proj.weight": 
"model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.17.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.17.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.18.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.18.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.19.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.19.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.20.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.20.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.21.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.21.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.22.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.22.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.23.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.23.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.24.gate_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.24.up_proj.weight": "model-00124-of-00132.safetensors", + "model.layers.88.mlp.experts.25.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.25.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.26.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.26.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.27.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.27.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.28.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.28.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.29.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.29.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.30.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.30.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.31.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.31.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.32.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.32.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.33.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.33.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.34.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.34.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.35.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.35.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.36.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.36.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.37.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.37.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.38.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.38.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.39.gate_proj.weight": 
"model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.39.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.40.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.40.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.41.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.41.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.42.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.42.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.43.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.43.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.44.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.44.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.45.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.45.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.46.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.46.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.47.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.47.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.48.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.48.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.49.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.49.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.50.gate_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.50.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.51.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.51.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.52.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.52.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.53.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.53.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.54.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.54.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.55.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.55.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.56.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.56.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.57.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.57.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.58.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.58.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.59.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.59.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.60.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.60.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.61.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.61.up_proj.weight": 
"model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.62.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.62.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.63.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.63.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.64.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.64.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.65.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.65.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.66.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.66.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.67.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.67.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.68.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.68.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.69.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.69.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.70.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.70.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.71.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.71.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.72.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.72.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.73.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.73.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.74.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.74.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.75.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.75.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.76.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.76.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.77.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.77.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.78.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.78.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.79.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.79.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.80.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.80.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.81.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.81.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.82.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.82.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.83.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.83.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.84.gate_proj.weight": 
"model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.84.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.85.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.85.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.86.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.86.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.87.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.87.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.88.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.88.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.89.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.89.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.90.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.90.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.91.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.91.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.92.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.92.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.93.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.93.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.94.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.94.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.95.gate_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.95.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.96.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.96.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.97.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.97.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.98.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.98.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.99.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.99.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.100.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.100.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.101.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.101.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.102.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.102.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.103.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.103.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.104.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.104.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.105.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.105.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.106.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.106.up_proj.weight": 
"model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.107.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.107.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.108.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.108.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.109.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.109.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.110.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.110.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.111.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.111.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.112.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.112.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.113.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.113.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.114.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.114.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.115.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.115.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.116.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.116.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.117.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.117.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.118.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.118.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.119.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.119.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.120.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.120.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.121.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.121.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.122.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.122.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.123.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.123.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.124.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.124.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.125.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.125.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.126.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.126.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.127.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.127.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.128.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.128.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.129.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.129.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.130.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.130.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.131.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.131.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.132.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.132.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.133.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.133.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.134.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.134.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.135.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.135.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.136.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.136.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.137.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.137.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.138.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.138.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.139.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.139.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.140.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.140.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.141.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.141.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.142.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.142.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.143.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.143.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.144.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.144.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.145.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.145.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.146.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.146.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.147.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.147.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.148.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.148.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.149.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.149.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.150.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.150.up_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.151.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.151.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.152.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.152.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.153.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.153.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.154.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.154.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.155.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.155.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.156.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.156.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.157.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.157.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.158.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.158.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.159.gate_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.159.up_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.0.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.1.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.2.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.3.down_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.4.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.5.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.6.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.7.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.8.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.9.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.10.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.11.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.12.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.13.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.14.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.15.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.16.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.17.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.18.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.19.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.20.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.21.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.22.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.23.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.24.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.25.down_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.26.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.27.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.28.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.29.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.30.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.31.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.32.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.33.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.34.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.35.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.36.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.37.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.38.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.39.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.40.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.41.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.42.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.43.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.44.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.45.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.46.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.47.down_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.48.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.49.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.50.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.51.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.52.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.53.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.54.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.55.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.56.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.57.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.58.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.59.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.60.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.61.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.62.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.63.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.64.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.65.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.66.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.67.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.68.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.69.down_proj.weight": "model-00125-of-00132.safetensors", + 
"model.layers.88.mlp.experts.70.down_proj.weight": "model-00125-of-00132.safetensors", + "model.layers.88.mlp.experts.71.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.72.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.73.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.74.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.75.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.76.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.77.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.78.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.79.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.80.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.81.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.82.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.83.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.84.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.85.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.86.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.87.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.88.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.89.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.90.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.91.down_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.88.mlp.experts.92.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.93.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.94.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.95.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.96.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.97.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.98.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.99.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.100.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.101.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.102.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.103.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.104.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.105.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.106.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.107.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.108.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.109.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.110.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.111.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.112.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.113.down_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.88.mlp.experts.114.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.115.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.116.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.117.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.118.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.119.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.120.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.121.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.122.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.123.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.124.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.125.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.126.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.127.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.128.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.129.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.130.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.131.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.132.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.133.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.134.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.135.down_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.88.mlp.experts.136.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.137.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.138.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.139.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.140.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.141.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.142.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.143.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.144.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.145.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.146.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.147.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.148.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.149.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.150.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.151.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.152.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.153.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.154.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.155.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.156.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.157.down_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.88.mlp.experts.158.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.experts.159.down_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.shared_experts.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.88.mlp.shared_experts.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.self_attn.o_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.input_layernorm.weight": "model-00126-of-00132.safetensors", + "model.layers.89.self_attn.q_norm.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.gate.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.gate.e_score_correction_bias": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.0.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.0.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.1.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.1.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.2.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.2.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.3.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.3.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.4.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.4.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.5.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.5.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.6.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.6.up_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.7.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.7.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.8.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.8.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.9.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.9.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.10.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.10.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.11.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.11.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.12.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.12.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.13.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.13.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.14.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.14.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.15.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.15.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.16.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.16.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.17.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.17.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.18.gate_proj.weight": 
"model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.18.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.19.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.19.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.20.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.20.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.21.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.21.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.22.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.22.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.23.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.23.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.24.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.24.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.25.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.25.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.26.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.26.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.27.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.27.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.28.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.28.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.29.gate_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.29.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.30.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.30.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.31.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.31.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.32.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.32.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.33.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.33.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.34.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.34.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.35.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.35.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.36.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.36.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.37.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.37.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.38.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.38.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.39.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.39.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.40.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.40.up_proj.weight": 
"model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.41.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.41.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.42.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.42.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.43.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.43.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.44.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.44.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.45.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.45.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.46.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.46.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.47.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.47.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.48.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.48.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.49.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.49.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.50.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.50.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.51.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.51.up_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.52.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.52.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.53.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.53.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.54.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.54.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.55.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.55.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.56.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.56.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.57.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.57.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.58.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.58.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.59.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.59.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.60.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.60.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.61.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.61.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.62.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.62.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.63.gate_proj.weight": 
"model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.63.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.64.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.64.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.65.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.65.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.66.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.66.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.67.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.67.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.68.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.68.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.69.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.69.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.70.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.70.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.71.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.71.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.72.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.72.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.73.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.73.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.74.gate_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.74.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.75.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.75.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.76.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.76.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.77.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.77.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.78.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.78.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.79.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.79.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.80.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.80.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.81.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.81.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.82.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.82.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.83.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.83.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.84.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.84.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.85.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.85.up_proj.weight": 
"model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.86.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.86.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.87.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.87.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.88.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.88.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.89.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.89.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.90.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.90.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.91.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.91.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.92.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.92.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.93.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.93.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.94.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.94.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.95.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.95.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.96.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.96.up_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.97.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.97.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.98.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.98.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.99.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.99.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.100.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.100.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.101.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.101.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.102.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.102.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.103.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.103.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.104.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.104.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.105.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.105.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.106.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.106.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.107.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.107.up_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.108.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.108.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.109.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.109.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.110.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.110.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.111.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.111.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.112.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.112.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.113.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.113.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.114.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.114.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.115.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.115.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.116.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.116.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.117.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.117.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.118.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.118.up_proj.weight": "model-00126-of-00132.safetensors", + 
"model.layers.89.mlp.experts.119.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.119.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.120.gate_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.120.up_proj.weight": "model-00126-of-00132.safetensors", + "model.layers.89.mlp.experts.121.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.121.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.122.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.122.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.123.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.123.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.124.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.124.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.125.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.125.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.126.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.126.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.127.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.127.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.128.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.128.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.129.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.129.up_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.130.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.130.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.131.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.131.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.132.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.132.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.133.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.133.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.134.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.134.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.135.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.135.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.136.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.136.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.137.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.137.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.138.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.138.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.139.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.139.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.140.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.140.up_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.141.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.141.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.142.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.142.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.143.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.143.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.144.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.144.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.145.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.145.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.146.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.146.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.147.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.147.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.148.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.148.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.149.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.149.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.150.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.150.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.151.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.151.up_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.152.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.152.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.153.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.153.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.154.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.154.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.155.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.155.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.156.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.156.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.157.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.157.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.158.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.158.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.159.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.159.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.0.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.1.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.2.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.3.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.4.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.5.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.6.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.7.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.8.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.9.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.10.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.11.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.12.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.13.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.14.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.15.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.16.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.17.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.18.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.19.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.20.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.21.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.22.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.23.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.24.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.25.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.26.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.27.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.28.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.29.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.30.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.31.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.32.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.33.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.34.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.35.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.36.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.37.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.38.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.39.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.40.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.41.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.42.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.43.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.44.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.45.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.46.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.47.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.48.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.49.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.50.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.51.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.52.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.53.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.54.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.55.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.56.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.57.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.58.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.59.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.60.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.61.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.62.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.63.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.64.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.65.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.66.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.67.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.68.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.69.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.70.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.71.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.72.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.73.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.74.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.75.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.76.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.77.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.78.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.79.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.80.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.81.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.82.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.83.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.84.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.85.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.86.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.87.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.88.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.89.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.90.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.91.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.92.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.93.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.94.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.95.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.96.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.97.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.98.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.99.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.100.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.101.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.102.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.103.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.104.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.105.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.106.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.107.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.108.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.109.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.110.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.111.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.112.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.113.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.114.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.115.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.116.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.117.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.118.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.119.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.120.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.121.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.122.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.123.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.124.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.125.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.126.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.127.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.128.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.129.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.130.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.131.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.132.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.133.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.134.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.135.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.136.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.137.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.experts.138.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.139.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.140.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.141.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.142.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.143.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.144.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.145.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.146.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.147.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.148.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.149.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.150.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.151.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.152.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.153.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.154.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.155.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.156.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.157.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.158.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.experts.159.down_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.89.mlp.shared_experts.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.shared_experts.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.89.mlp.shared_experts.down_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.input_layernorm.weight": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.q_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.k_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.v_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.q_proj.bias": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.k_proj.bias": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.v_proj.bias": "model-00127-of-00132.safetensors", + "model.layers.90.self_attn.q_norm.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.0.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.0.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.1.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.1.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.2.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.2.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.3.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.3.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.4.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.4.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.5.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.5.up_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.90.mlp.experts.6.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.6.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.7.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.7.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.8.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.8.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.9.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.9.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.10.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.10.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.11.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.11.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.12.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.12.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.13.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.13.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.14.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.14.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.15.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.15.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.16.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.16.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.17.gate_proj.weight": 
"model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.17.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.18.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.18.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.19.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.19.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.20.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.20.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.21.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.21.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.22.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.22.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.23.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.23.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.24.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.24.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.25.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.25.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.26.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.26.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.27.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.27.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.28.gate_proj.weight": "model-00127-of-00132.safetensors", + 
"model.layers.90.mlp.experts.28.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.29.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.29.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.30.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.30.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.31.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.31.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.32.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.32.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.33.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.33.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.34.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.34.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.35.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.35.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.36.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.36.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.37.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.37.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.38.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.38.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.39.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.39.up_proj.weight": 
"model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.40.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.40.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.41.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.41.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.42.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.42.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.43.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.43.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.44.gate_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.44.up_proj.weight": "model-00127-of-00132.safetensors", + "model.layers.90.mlp.experts.45.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.45.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.46.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.46.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.47.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.47.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.48.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.48.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.49.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.49.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.50.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.50.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.51.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.51.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.52.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.52.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.53.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.53.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.54.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.54.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.55.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.55.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.56.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.56.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.57.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.57.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.58.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.58.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.59.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.59.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.60.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.60.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.61.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.61.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.62.gate_proj.weight": 
"model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.62.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.63.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.63.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.64.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.64.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.65.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.65.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.66.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.66.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.67.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.67.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.68.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.68.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.69.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.69.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.70.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.70.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.71.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.71.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.72.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.72.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.73.gate_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.73.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.74.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.74.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.75.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.75.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.76.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.76.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.77.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.77.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.78.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.78.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.79.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.79.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.80.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.80.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.81.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.81.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.82.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.82.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.83.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.83.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.84.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.84.up_proj.weight": 
"model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.85.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.85.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.86.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.86.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.87.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.87.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.88.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.88.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.89.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.89.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.90.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.90.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.91.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.91.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.92.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.92.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.93.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.93.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.94.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.94.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.95.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.95.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.96.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.96.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.97.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.97.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.98.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.98.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.99.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.99.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.100.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.100.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.101.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.101.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.102.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.102.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.103.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.103.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.104.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.104.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.105.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.105.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.106.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.106.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.107.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.107.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.108.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.108.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.109.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.109.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.110.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.110.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.111.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.111.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.112.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.112.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.113.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.113.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.114.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.114.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.115.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.115.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.116.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.116.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.117.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.117.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.118.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.118.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.119.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.119.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.120.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.120.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.121.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.121.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.122.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.122.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.123.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.123.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.124.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.124.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.125.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.125.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.126.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.126.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.127.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.127.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.128.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.128.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.129.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.129.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.130.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.130.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.131.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.131.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.132.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.132.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.133.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.133.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.134.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.134.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.135.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.135.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.136.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.136.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.137.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.137.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.138.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.138.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.139.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.139.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.140.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.140.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.141.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.141.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.142.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.142.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.143.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.143.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.144.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.144.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.145.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.145.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.146.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.146.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.147.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.147.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.148.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.148.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.149.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.149.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.150.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.150.up_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.151.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.151.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.152.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.152.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.153.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.153.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.154.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.154.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.155.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.155.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.156.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.156.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.157.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.157.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.158.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.158.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.159.gate_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.159.up_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.0.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.1.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.2.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.3.down_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.4.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.5.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.6.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.7.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.8.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.9.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.10.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.11.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.12.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.13.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.14.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.15.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.16.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.17.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.18.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.19.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.20.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.21.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.22.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.23.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.24.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.25.down_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.26.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.27.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.28.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.29.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.30.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.31.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.32.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.33.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.34.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.35.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.36.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.37.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.38.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.39.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.40.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.41.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.42.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.43.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.44.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.45.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.46.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.47.down_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.48.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.49.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.50.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.51.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.52.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.53.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.54.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.55.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.56.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.57.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.58.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.59.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.60.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.61.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.62.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.63.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.64.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.65.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.66.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.67.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.68.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.69.down_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.70.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.71.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.72.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.73.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.74.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.75.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.76.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.77.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.78.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.79.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.80.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.81.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.82.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.83.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.84.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.85.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.86.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.87.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.88.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.89.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.90.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.91.down_proj.weight": "model-00128-of-00132.safetensors", + 
"model.layers.90.mlp.experts.92.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.93.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.94.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.95.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.96.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.97.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.98.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.99.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.100.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.101.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.102.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.103.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.104.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.105.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.106.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.107.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.108.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.109.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.110.down_proj.weight": "model-00128-of-00132.safetensors", + "model.layers.90.mlp.experts.111.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.112.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.113.down_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.90.mlp.experts.114.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.115.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.116.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.117.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.118.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.119.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.120.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.121.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.122.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.123.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.124.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.125.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.126.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.127.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.128.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.129.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.130.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.131.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.132.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.133.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.134.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.135.down_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.90.mlp.experts.136.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.137.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.138.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.139.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.140.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.141.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.142.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.143.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.144.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.145.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.146.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.147.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.148.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.149.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.150.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.151.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.152.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.153.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.154.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.155.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.156.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.157.down_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.90.mlp.experts.158.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.experts.159.down_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.shared_experts.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.90.mlp.shared_experts.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.self_attn.o_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.input_layernorm.weight": "model-00129-of-00132.safetensors", + "model.layers.91.self_attn.q_norm.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.gate.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.gate.e_score_correction_bias": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.0.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.0.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.1.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.1.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.2.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.2.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.3.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.3.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.4.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.4.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.5.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.5.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.6.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.6.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.7.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.7.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.8.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.8.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.9.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.9.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.10.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.10.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.11.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.11.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.12.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.12.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.13.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.13.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.14.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.14.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.15.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.15.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.16.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.16.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.17.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.17.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.18.gate_proj.weight": 
"model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.18.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.19.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.19.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.20.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.20.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.21.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.21.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.22.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.22.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.23.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.23.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.24.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.24.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.25.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.25.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.26.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.26.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.27.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.27.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.28.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.28.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.29.gate_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.29.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.30.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.30.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.31.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.31.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.32.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.32.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.33.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.33.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.34.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.34.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.35.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.35.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.36.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.36.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.37.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.37.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.38.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.38.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.39.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.39.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.40.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.40.up_proj.weight": 
"model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.41.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.41.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.42.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.42.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.43.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.43.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.44.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.44.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.45.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.45.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.46.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.46.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.47.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.47.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.48.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.48.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.49.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.49.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.50.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.50.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.51.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.51.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.52.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.52.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.53.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.53.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.54.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.54.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.55.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.55.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.56.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.56.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.57.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.57.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.58.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.58.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.59.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.59.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.60.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.60.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.61.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.61.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.62.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.62.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.63.gate_proj.weight": 
"model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.63.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.64.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.64.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.65.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.65.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.66.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.66.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.67.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.67.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.68.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.68.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.69.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.69.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.70.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.70.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.71.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.71.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.72.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.72.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.73.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.73.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.74.gate_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.74.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.75.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.75.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.76.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.76.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.77.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.77.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.78.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.78.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.79.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.79.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.80.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.80.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.81.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.81.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.82.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.82.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.83.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.83.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.84.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.84.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.85.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.85.up_proj.weight": 
"model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.86.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.86.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.87.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.87.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.88.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.88.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.89.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.89.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.90.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.90.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.91.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.91.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.92.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.92.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.93.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.93.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.94.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.94.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.95.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.95.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.96.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.96.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.97.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.97.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.98.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.98.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.99.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.99.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.100.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.100.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.101.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.101.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.102.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.102.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.103.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.103.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.104.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.104.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.105.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.105.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.106.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.106.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.107.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.107.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.108.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.108.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.109.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.109.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.110.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.110.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.111.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.111.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.112.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.112.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.113.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.113.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.114.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.114.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.115.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.115.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.116.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.116.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.117.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.117.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.118.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.118.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.119.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.119.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.120.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.120.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.121.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.121.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.122.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.122.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.123.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.123.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.124.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.124.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.125.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.125.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.126.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.126.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.127.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.127.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.128.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.128.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.129.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.129.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.130.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.130.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.131.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.131.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.132.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.132.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.133.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.133.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.134.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.134.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.135.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.135.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.136.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.136.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.137.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.137.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.138.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.138.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.139.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.139.up_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.140.gate_proj.weight": "model-00129-of-00132.safetensors", + "model.layers.91.mlp.experts.140.up_proj.weight": "model-00129-of-00132.safetensors", + 
"model.layers.91.mlp.experts.141.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.141.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.142.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.142.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.143.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.143.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.144.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.144.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.145.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.145.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.146.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.146.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.147.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.147.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.148.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.148.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.149.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.149.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.150.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.150.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.151.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.151.up_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.152.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.152.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.153.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.153.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.154.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.154.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.155.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.155.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.156.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.156.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.157.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.157.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.158.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.158.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.159.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.159.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.0.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.1.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.2.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.3.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.4.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.5.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.6.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.7.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.8.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.9.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.10.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.11.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.12.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.13.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.14.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.15.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.16.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.17.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.18.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.19.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.20.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.21.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.22.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.23.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.24.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.25.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.26.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.27.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.28.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.29.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.30.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.31.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.32.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.33.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.34.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.35.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.36.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.37.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.38.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.39.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.40.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.41.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.42.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.43.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.44.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.45.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.46.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.47.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.48.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.49.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.50.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.51.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.52.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.53.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.54.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.55.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.56.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.57.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.58.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.59.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.60.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.61.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.62.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.63.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.64.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.65.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.66.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.67.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.68.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.69.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.70.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.71.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.72.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.73.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.74.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.75.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.76.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.77.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.78.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.79.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.80.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.81.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.82.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.83.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.84.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.85.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.86.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.87.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.88.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.89.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.90.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.91.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.92.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.93.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.94.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.95.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.96.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.97.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.98.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.99.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.100.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.101.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.102.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.103.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.104.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.105.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.106.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.107.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.108.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.109.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.110.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.111.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.112.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.113.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.114.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.115.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.116.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.117.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.118.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.119.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.120.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.121.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.122.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.123.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.124.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.125.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.126.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.127.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.128.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.129.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.130.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.131.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.132.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.133.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.134.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.135.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.136.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.137.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.experts.138.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.139.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.140.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.141.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.142.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.143.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.144.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.145.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.146.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.147.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.148.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.149.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.150.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.151.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.152.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.153.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.154.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.155.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.156.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.157.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.158.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.experts.159.down_proj.weight": "model-00130-of-00132.safetensors", + 
"model.layers.91.mlp.shared_experts.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.shared_experts.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.91.mlp.shared_experts.down_proj.weight": "model-00130-of-00132.safetensors", + "lm_head.weight": "model-00130-of-00132.safetensors", + "model.layers.69.input_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.q_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.k_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.v_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.q_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.k_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.v_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.69.self_attn.k_norm.weight": "model-00130-of-00132.safetensors", + "model.layers.69.post_attention_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.69.mlp.gate.weight": "model-00130-of-00132.safetensors", + "model.layers.69.mlp.shared_experts.gate_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.69.mlp.shared_experts.up_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.69.mlp.shared_experts.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.o_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.70.input_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.q_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.k_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.v_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.q_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.k_proj.bias": "model-00130-of-00132.safetensors", + 
"model.layers.70.self_attn.v_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.70.self_attn.k_norm.weight": "model-00130-of-00132.safetensors", + "model.layers.70.post_attention_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.70.mlp.gate.weight": "model-00130-of-00132.safetensors", + "model.layers.70.mlp.gate.e_score_correction_bias": "model-00130-of-00132.safetensors", + "model.layers.70.mlp.shared_experts.down_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.71.input_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.q_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.k_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.v_proj.weight": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.q_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.k_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.v_proj.bias": "model-00130-of-00132.safetensors", + "model.layers.71.self_attn.k_norm.weight": "model-00130-of-00132.safetensors", + "model.layers.71.post_attention_layernorm.weight": "model-00130-of-00132.safetensors", + "model.layers.72.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.72.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.72.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.72.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.72.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.72.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.72.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.72.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.72.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + 
"model.layers.72.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.73.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.73.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.73.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.74.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.74.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.74.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.74.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.74.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.74.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.74.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.74.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.74.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.74.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.75.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + 
"model.layers.75.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.75.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.75.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.76.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.76.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.76.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.76.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.76.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.76.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.76.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.76.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.76.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.76.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.77.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.77.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.77.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + 
"model.layers.78.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.78.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.78.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.78.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.78.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.78.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.78.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.78.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.78.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.78.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.79.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.79.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.79.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.80.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.80.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.80.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.80.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.80.mlp.gate.weight": "model-00131-of-00132.safetensors", + 
"model.layers.80.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.80.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.81.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.81.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.81.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.82.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.82.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.82.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.82.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.82.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.82.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.82.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.83.input_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + 
"model.layers.83.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.83.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.83.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.84.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.84.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.84.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.84.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.84.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.84.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.85.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.85.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.86.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.86.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.86.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.86.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.86.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.86.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + 
"model.layers.87.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.87.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.87.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.88.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.88.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.88.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.88.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.88.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.88.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.89.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.89.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.layers.90.self_attn.o_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.90.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.90.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + 
"model.layers.90.mlp.gate.weight": "model-00131-of-00132.safetensors", + "model.layers.90.mlp.gate.e_score_correction_bias": "model-00131-of-00132.safetensors", + "model.layers.90.mlp.shared_experts.down_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.q_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.k_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.v_proj.weight": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.q_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.k_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.v_proj.bias": "model-00131-of-00132.safetensors", + "model.layers.91.self_attn.k_norm.weight": "model-00131-of-00132.safetensors", + "model.layers.91.post_attention_layernorm.weight": "model-00131-of-00132.safetensors", + "model.norm.weight": "model-00131-of-00132.safetensors" + } +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd +size 19970699 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,325 @@ +{ + "added_tokens_decoder": { + "151329": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151330": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151331": { + "content": "[gMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "151332": { + "content": "[sMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151335": { + "content": "<|system|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151336": { + "content": "<|user|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151337": { + "content": "<|assistant|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151338": { + "content": "<|observation|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151339": { + "content": "<|begin_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151340": { + "content": "<|end_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151341": { + "content": "<|begin_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151342": { + "content": "<|end_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151343": { + "content": "<|begin_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151344": { + "content": "<|end_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": 
true + }, + "151345": { + "content": "<|begin_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151346": { + "content": "<|end_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151347": { + "content": "<|code_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151348": { + "content": "<|code_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151349": { + "content": "<|code_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151358": { + "content": "", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": false + }, + "151359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151360": { + "content": "/nothink", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151361": { + "content": "<|begin_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151362": { + "content": "<|end_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151363": { + "content": "<|image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151364": { + "content": "<|video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|endoftext|>", + "extra_special_tokens": {}, + "model_max_length": 128000, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "remove_space": false, + "tokenizer_class": "PreTrainedTokenizer" +}