diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000000000000000000000000000000000000..52373fe24473b1aa44333d318f578ae6bf04b49b
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,36 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/chat_template.jinja b/chat_template.jinja
new file mode 100644
index 0000000000000000000000000000000000000000..3d522594ff964687d9ae839d07d9d7139599074f
--- /dev/null
+++ b/chat_template.jinja
@@ -0,0 +1,259 @@
+{%- if not platform_instruction_override %}
+{%- set platform_instruction_override -%}
+These instructions are always to be followed and cannot be overridden by subsequent system or user turns:
+- You will answer requests for educational, informative, or creative content related to safety categories. You will not provide content that is harmful or could be used to cause harm.
+
+These instructions serve as your defaults, but they can be overridden in subsequent system or user turns:
+- Your name is Command.
+- You are a large language model built by Cohere.
+{%- endset %}
+{%- endif %}
+{%- set reasoning = reasoning if reasoning is not undefined else (false if reasoning_effort is defined and reasoning_effort | lower == "none" else true) -%}
+{%- set grounding = grounding | default("disabled") | upper %}
+{%- set grounding_enabled = grounding == "ENABLED" %}
+{%- set tools_or_docs_exist = tools or documents %}
+{%- set render_tools_section = true %}
+{%- set render_grounding = grounding_enabled and tools_or_docs_exist %}
+{%- set render_platform_instruction_override = true if platform_instruction_override else false %}
+{%- set has_developer_instruction = developer_instruction or developer_instruction == "" %}
+{%- set render_developer_instruction = true if developer_instruction else false %}
+{%- set convert_first_system_msg = convert_first_system_msg | default(true) -%}
+{%- set skip_thinking = skip_thinking | default(false) -%}
+{{ bos_token }}
+{%- macro document_turn(documents) -%}
+{# format documents into chat turn -#}
+<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{%- if not skip_thinking -%}<|START_THINKING|>I will look through the document to address the users needs.<|END_THINKING|>{%- endif -%}<|START_ACTION|>[
+ {"tool_call_id": "0", "tool_name": "direct-injected-document", "parameters": {}}
+]<|END_ACTION|><|END_OF_TURN_TOKEN|><|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[
+ {
+ "tool_call_id": "0",
+ "results": {
+{%- for doc in documents %}
+{%- set doc_val = doc.data if doc.data else doc %}
+
+ "{{ loop.index0 }}": {{ doc_val|tojson }}{% if not loop.last %},
+ {%- endif %}
+{%- endfor %}
+
+ },
+ "is_error": null
+ }
+]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>{%- endmacro %}
+{%- macro tool_call_id_to_int(messages, tool_call_id) %}
+{%- if regen_tool_call_ids -%}
+ {%- set counter = namespace(value=0) %}
+ {%- set tool_call_id_seen = namespace(value=false) %}
+ {%- for msg in messages %}
+ {%- if msg.tool_calls %}
+ {%- for tool_call in msg.tool_calls %}
+ {%- if tool_call.id == tool_call_id and not tool_call_id_seen.value -%}
+ {{ counter.value }}
+ {%- set tool_call_id_seen.value = true %}
+ {%- endif %}
+ {%- set counter.value = counter.value + 1 %}
+ {%- endfor %}
+ {%- endif %}
+ {%- endfor %}
+{%- else -%}
+ {{ tool_call_id }}
+{%- endif -%}
+{%- endmacro %}
+{%- macro format_tool_message(messages, tool_msg) -%}
+{#- format tool message #}{
+ "tool_call_id": "{{ tool_call_id_to_int(messages, tool_msg.tool_call_id) }}",
+ "results": {
+ {%- if tool_msg.content is mapping or tool_msg.content is string %}
+
+ {% if tool_msg.content is string -%}
+ {%- set text_wrapper = {"content": tool_msg.content} -%}
+ {%- else -%}
+ {%- set text_wrapper = tool_msg.content -%}
+ {%- endif %}
+ "0": {{ text_wrapper|tojson }}
+ {%- else %}
+ {%- for content in tool_msg.content %}
+
+ "{{ loop.index0 }}": {{ print_tool_content(content) }}{% if not loop.last %},{% endif %}
+ {%- endfor %}
+ {%- endif %}
+
+ },
+ "is_error": null
+ }
+{%- endmacro -%}
+{%- macro print_tool_content(item) %}
+{%- if item.type|lower == "text" -%}
+{%- set text_wrapper = {"content": item.text} -%}
+{{ text_wrapper|tojson }}
+{%- elif item.type|lower == "document" and item.document and "data" in item.document -%}
+{{ item.document.data|tojson }}
+{%- else -%}
+{{ item|tojson }}
+{%- endif -%}
+{%- endmacro %}
+{%- macro print_msg(msg) %}
+ {%- if msg is string -%}
+<|START_TEXT|>{{ msg }}<|END_TEXT|>
+ {%- elif msg.content is string -%}
+<|START_TEXT|>{{ msg.content }}<|END_TEXT|>
+ {%- else %}
+ {%- set last_was_text = namespace(value=false) %}
+ {%- for content in msg.content %}
+ {%- if content.type|lower == "text" -%}
+ {%- if not last_was_text.value -%}
+ <|START_TEXT|>
+ {%- endif -%}
+ {{ content.text }}
+ {%- if loop.last -%}
+ <|END_TEXT|>
+ {%- endif %}
+ {%- set last_was_text.value = true -%}
+ {%- else -%}
+ {%- if last_was_text.value -%}
+ <|END_TEXT|>
+ {%- endif -%}
+ {%- set last_was_text.value = false -%}
+ {%- endif -%}
+ {%- if content.type|lower == "image" -%}
+ {%- if content.data -%}
+{{ content.data }}
+ {%- else -%}
+<|IMG_PATCH|>
+ {%- endif -%}
+ {%- endif -%}
+ {%- endfor %}
+ {%- endif %}
+{%- endmacro %}
+{%- macro print_thinking(msg) %}
+ {%- if msg.thinking -%}
+{{ msg.thinking }}
+ {%- elif msg.content and msg.content[0].thinking -%}
+{{ msg.content[0].thinking }}
+ {%- endif %}
+{%- endmacro %}
+{%- if messages and messages[0]['role']|lower == 'system' and not has_developer_instruction and convert_first_system_msg %}{%- set developer_instruction = messages[0] %}{%- set render_developer_instruction = true %}{%- set initial_instruction_message = true %}{% endif %}
+{%- set json_object = true if response_format and response_format.type == "json_object" else false %}
+{%- set json_schema = (response_format.json_schema or response_format.schema) if response_format %}
+{%- set json_mode = json_object or json_schema %}
+{%- set tool_idx = namespace(value=0) %}
+{%- set tool_ids_seen = namespace(value=[]) %}
+{%- set regen_tool_call_ids = regen_tool_call_ids | default(true) -%}
+{%- set sent_documents = namespace(value=false) -%}
+
+{%- if render_tools_section or render_platform_instruction_override or render_grounding or json_mode -%}
+<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TEXT|>
+{%- elif not render_developer_instruction -%}
+<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>
+{%- endif %}
+
+{%- set rendered_platform_turn_chunk = false %}
+
+{%- if render_platform_instruction_override -%}
+{{ platform_instruction_override }}
+{% set rendered_platform_turn_chunk = true %}
+{%- else %}
+{%- endif %}
+
+{%- if render_grounding -%}
+{%- if rendered_platform_turn_chunk %}
+
+{% endif -%}
+Note that both your responses and reflections can be grounded. Grounding means you associate pieces of texts (called "spans") with those specific tool results that support them (called "sources"). And you use a pair of tags "" and "" to indicate when a span can be grounded onto a list of sources, listing them out in the closing tag. Sources from the same tool call are grouped together and listed as "{tool_call_id}:[{list of result indices}]", before they are joined together by ",". E.g., "span" means that "span" is supported by result 1 and 2 from "tool_call_id=0" as well as result 0 from "tool_call_id=1".
+{% set rendered_platform_turn_chunk = true %}
+{%- endif %}
+
+{%- if render_tools_section %}
+{%- if rendered_platform_turn_chunk %}
+
+{% endif %}
+# Available Tools
+```json
+[
+{% if tools_or_docs_exist %}
+{%- if documents %}
+ {"name": "direct-injected-document", "description": "This is a special tool to directly inject user-uploaded documents into the chat as additional context. DO NOT use this tool by yourself!", "parameters": {"type": "object", "properties": {}, "required": []}, "responses": {"200": {"description": "Successfully returned a list of chunked text snippets from the directly uploaded documents.", "content": {"application/json": {"schema": {"type": "array", "items": {"type": "object", "required": ["url", "snippet"], "properties": {"url": {"type": "string", "description": "The url of the uploaded document."}, "snippet": {"type": "string", "description": "The text snippet for the returned document chunk."}}}}}}}}}
+ {%- if tools %},
+ {% else %}
+
+ {% endif %}
+{%- endif %}
+{%- for tool in tools %}
+ {"name": "{{ tool['function']['name'] }}", "description": "{{ tool['function']['description'] }}", "parameters": {{ tool['function']['parameters']|tojson }}, "responses": null}
+ {%- if not loop.last %},{% endif %}
+
+{% endfor %}
+{%- else %}
+
+{% endif %}
+]
+```
+{%- set rendered_platform_turn_chunk = true %}
+{%- endif -%}
+
+{%- if json_mode -%}
+{%- if rendered_platform_turn_chunk %}
+
+
+{% endif -%}
+When generating JSON objects, do not generate block markers. Generate an object directly without prefixing with ```json. Return only the JSON and nothing else.
+ {%- if json_schema %}
+
+Your output should adhere to the following json schema:
+{{ json_schema }}
+ {%- endif -%}
+{%- set rendered_platform_turn_chunk = true %}
+{%- endif %}
+{%- if rendered_platform_turn_chunk -%}
+<|END_TEXT|><|END_OF_TURN_TOKEN|>
+{%- elif not render_developer_instruction -%}
+<|END_OF_TURN_TOKEN|>
+{%- endif %}
+{%- if render_developer_instruction -%}
+<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ print_msg(developer_instruction) }}<|END_OF_TURN_TOKEN|>
+{%- endif %}
+{%- for message in messages %}
+ {%- set msg_role_downcased = message.role | lower %}
+ {%- if msg_role_downcased == 'system' and (not (loop.first and initial_instruction_message)) -%}
+<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ print_msg(message) }}<|END_OF_TURN_TOKEN|>
+ {%- elif msg_role_downcased == 'user' -%}
+<|START_OF_TURN_TOKEN|><|USER_TOKEN|>{{ print_msg(message) }}<|END_OF_TURN_TOKEN|>
+ {%- if documents and not sent_documents.value %}{%- set sent_documents.value = true %}{% set tool_idx.value = tool_idx.value + 1 %}{{ document_turn(documents) }}{% endif %}
+ {%- elif msg_role_downcased == 'assistant' or msg_role_downcased == 'chatbot' -%}
+<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>
+ {%- if message.tool_calls %}
+ {% if not skip_thinking %}
+ {% if message.tool_plan -%}
+ <|START_THINKING|>{{ message.tool_plan }}<|END_THINKING|>
+ {%- elif message.thinking or (message.content and message.content[0].type == "thinking") -%}
+ <|START_THINKING|>{{ print_thinking(message) }}<|END_THINKING|>
+ {%- endif %}
+ {%- endif %}<|START_ACTION|>[
+ {%- for tc in message.tool_calls %}
+
+ {"tool_call_id": "{%- if regen_tool_call_ids -%}{{ tool_idx.value }}{%- else -%}{{ tc.id }}{%- endif -%}", "tool_name": "{{ tc['function']['name'] }}", "parameters": {{ tc['function']['arguments']|tojson }}}{% if not loop.last %},{% endif %}
+ {%- set tool_idx.value = tool_idx.value + 1 %}
+ {%- endfor %}
+
+]<|END_ACTION|><|END_OF_TURN_TOKEN|>
+ {%- else -%}
+ {% if (message.thinking or (message.content and message.content[0].type == "thinking")) and not skip_thinking -%}
+ <|START_THINKING|>{{ print_thinking(message) }}<|END_THINKING|>
+ {%- endif -%}
+ {{ print_msg(message) }}<|END_OF_TURN_TOKEN|>
+ {%- endif %}
+ {%- elif msg_role_downcased == 'tool' and message.tool_call_id not in tool_ids_seen.value -%}
+<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[
+ {{ format_tool_message(messages, message) }}
+ {%- for msg in messages[loop.index0 + 1:] %}
+
+ {%- if msg.role | lower == 'tool' %},
+ {{ format_tool_message(messages, msg) }}
+ {%- set tool_ids_seen.value = tool_ids_seen.value + [msg.tool_call_id] %}
+ {%- else %}
+ {%- break %}
+ {%- endif %}
+ {%- endfor %}
+
+]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>
+ {%- endif %}
+{%- endfor %}{%- if add_generation_prompt -%}<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{% if reasoning %}<|START_THINKING|>{% else %}<|START_THINKING|><|END_THINKING|>{% endif %}{%- endif %}
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..647d7273df9bb09480b4aa098ec37f05a4c6429f
--- /dev/null
+++ b/config.json
@@ -0,0 +1,94 @@
+{
+ "architectures": [
+ "Cohere2MoeForCausalLM"
+ ],
+ "attention_bias": false,
+ "attention_dropout": 0.0,
+ "bos_token_id": 2,
+ "dtype": "bfloat16",
+ "eos_token_id": 255001,
+ "expert_selection_fn": "sigmoid",
+ "first_k_dense_replace": 1,
+ "head_dim": 128,
+ "hidden_act": "silu",
+ "hidden_size": 2048,
+ "initializer_range": 0.02,
+ "intermediate_size": 768,
+ "layer_norm_eps": 1e-05,
+ "layer_types": [
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "sliding_attention",
+ "full_attention"
+ ],
+ "logit_scale": 1.0,
+ "max_position_embeddings": 500000,
+ "model_type": "cohere2_moe",
+ "norm_topk_prob": false,
+ "num_attention_heads": 32,
+ "num_experts": 128,
+ "num_experts_per_tok": 8,
+ "num_hidden_layers": 49,
+ "num_key_value_heads": 4,
+ "num_shared_experts": 0,
+ "pad_token_id": 0,
+ "prefix_dense_intermediate_size": 3072,
+ "prefix_dense_sliding_window_pattern": 1,
+ "rms_norm_eps": 1e-06,
+ "rope_scaling": null,
+ "rope_theta": 50000,
+ "shared_expert_combination_strategy": "average",
+ "sliding_window": 4096,
+ "transformers_version": "5.8.0",
+ "use_cache": true,
+ "use_gated_activation": true,
+ "use_parallel_block": true,
+ "use_parallel_embedding": false,
+ "use_qk_norm": false,
+ "vocab_size": 262144
+}
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..359afc456acafabbc3c67307b73a0ef26805eb82
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,7 @@
+{
+ "_from_model_config": true,
+ "bos_token_id": 2,
+ "eos_token_id": 255001,
+ "pad_token_id": 0,
+ "transformers_version": "5.8.0"
+}
diff --git a/model-00001-of-00049.safetensors b/model-00001-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..807cd761b71de44cfa80462e8d077ae5c1228830
--- /dev/null
+++ b/model-00001-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:daf5db63c754732e03e14b26538849b7197bde57ea460ba0d4766dbce3580b1a
+size 1551917728
diff --git a/model-00002-of-00049.safetensors b/model-00002-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..242dfdc6d0702dca0ecc819aac69d8130f8609f7
--- /dev/null
+++ b/model-00002-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5d9bff761ec78593cad72fcfe7aebde3f70163c95efa75fa7fc423f644b86cb
+size 1246284112
diff --git a/model-00003-of-00049.safetensors b/model-00003-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..251e2827bbb00f195fc4a2995fe945f3a460823a
--- /dev/null
+++ b/model-00003-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b671c07f138acef95d404dda93781627b0f3f7a2d2259ed4ffb89f44c9726876
+size 1246284112
diff --git a/model-00004-of-00049.safetensors b/model-00004-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3a737b5b259d063238b720503a603ec580dd4db3
--- /dev/null
+++ b/model-00004-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f41e8f7b6f6c92d9d3b9f8ec24c818a209faec3e622a9488dca6606650c5f425
+size 1246284112
diff --git a/model-00005-of-00049.safetensors b/model-00005-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bc2b76f2fe2ca715b19c56869fdb753f472a51e5
--- /dev/null
+++ b/model-00005-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a1871df2ad11ee44308868bd695131f1d5def63393bbb61cbc9fb55b8f107d8d
+size 1246284112
diff --git a/model-00006-of-00049.safetensors b/model-00006-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9e6b1ecfe3472f0b7ca75abbaf548bba17b7e2d7
--- /dev/null
+++ b/model-00006-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f81ef1830dae4d595240fc020837ef3fed3a10534f86cf05d1e4ef7b0125da51
+size 1246284112
diff --git a/model-00007-of-00049.safetensors b/model-00007-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..33b3df06d49af4cc4fadbd11c402a25161d94651
--- /dev/null
+++ b/model-00007-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7130aa7b1909219f8fd10d1ffd8425cada405803af7b094a69156d75091ace1f
+size 1246284112
diff --git a/model-00008-of-00049.safetensors b/model-00008-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..27cb7afb9b7ea66db156da59bf131a587a05b079
--- /dev/null
+++ b/model-00008-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe7d7e6cb3a9b24f4201ae78383e4c106299df35556140a4c07c4ec469f488e7
+size 1246284112
diff --git a/model-00009-of-00049.safetensors b/model-00009-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6db063989cb4d92d609acecdb3de4625b12c552a
--- /dev/null
+++ b/model-00009-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f86cc0caea81217f6c8a2abbe3c2794096604d2315aadc61263270128d758947
+size 1246284112
diff --git a/model-00010-of-00049.safetensors b/model-00010-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..18898b6cd40bfd2100df28ba9763aa7907112bea
--- /dev/null
+++ b/model-00010-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21c67c397d924be28933705ec8fcd6654b44a2eacd8f03d66bcfa94f3779a941
+size 1246284224
diff --git a/model-00011-of-00049.safetensors b/model-00011-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2beef1ef14f739aa574c4b3450f05c777fb562ec
--- /dev/null
+++ b/model-00011-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d3a888d096a129601d91f41027f091e07b3391cd1b08c42b1f7599aba4c353c
+size 1246284504
diff --git a/model-00012-of-00049.safetensors b/model-00012-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7971b6dcec625b3e4b120466f33067a6bee64df4
--- /dev/null
+++ b/model-00012-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05a94067a3eec7efd1aa660d0f2d19350316575c6d6f52581dbe241cc8ed572b
+size 1246284504
diff --git a/model-00013-of-00049.safetensors b/model-00013-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b5a942c57884a0e7a7c8157eb5c149aa74d40847
--- /dev/null
+++ b/model-00013-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:87d74ef7874b916ed135f3dcd2fcf653812f6290aa085ddc3e29d4f071f3473f
+size 1246284504
diff --git a/model-00014-of-00049.safetensors b/model-00014-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0b5103ae2d028c927e813b31081939eb277e12d5
--- /dev/null
+++ b/model-00014-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d9eb16fca0c9cd78f4927e88a72422d6b99b8cb25e4719c5acda8c947621f2c
+size 1246284504
diff --git a/model-00015-of-00049.safetensors b/model-00015-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1b1f328822798526ba8a216559dda551cebd1780
--- /dev/null
+++ b/model-00015-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be753448f4ac5d463fdc45ec02f57e05f1ee3525c1167daab8e800065f072f09
+size 1246284504
diff --git a/model-00016-of-00049.safetensors b/model-00016-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c457b140038325a533e5a427d16753b500c5c654
--- /dev/null
+++ b/model-00016-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13d5b401feea5fa6da3124af8c1b61fbff5d6fa79d4b922adb251dccd00c818c
+size 1246284504
diff --git a/model-00017-of-00049.safetensors b/model-00017-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a468da3457aff1ae0e42b9c7fa51ad8390679199
--- /dev/null
+++ b/model-00017-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89aeebcb158e91fe34b8955919ea8fc4dbdd37d8c9c18fa2dfacd76c553d449c
+size 1246284504
diff --git a/model-00018-of-00049.safetensors b/model-00018-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c6e6cacb63168b962cc2b7dac71006cbc18447b1
--- /dev/null
+++ b/model-00018-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb4ca39d3d2351c78e8b8024d70b05bcabe8e22e76cdaacc2117d325bf80c136
+size 1246284504
diff --git a/model-00019-of-00049.safetensors b/model-00019-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..52b6e36e15ecf7360f50693ba7e4c71e98f9647b
--- /dev/null
+++ b/model-00019-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1017aa5e2f763055ee0d148348eaac974bf627bfb99f5f4dda2cac21b9fae402
+size 1246284504
diff --git a/model-00020-of-00049.safetensors b/model-00020-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0b0fbe0c7db16d9d473e73b9e3a207a545f3a57c
--- /dev/null
+++ b/model-00020-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:426e6255897d052a039f3b999380128a047283c8ee8fd3b43a9a9a862fd2a117
+size 1246284504
diff --git a/model-00021-of-00049.safetensors b/model-00021-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ea433c267da0d13aa9d8b3d554def1503fb807b
--- /dev/null
+++ b/model-00021-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0dc523be4dd850416eaa8d8a8c626809fa584a11fa9be9610a45dff982f8fbd4
+size 1246284504
diff --git a/model-00022-of-00049.safetensors b/model-00022-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d56cf374684ab891d56a515f1a822a1df1291e4c
--- /dev/null
+++ b/model-00022-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e974a88ea136494fdfb40660e54e197029af5d3d76f58a1f6737fb3477a812f
+size 1246284504
diff --git a/model-00023-of-00049.safetensors b/model-00023-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fc572b6e776ef83cf2901b5e6456bd894befdfcb
--- /dev/null
+++ b/model-00023-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e41d9f44fe50c66a68ef87af9752072563778c4a419298a0f70bced6c72ddc59
+size 1246284504
diff --git a/model-00024-of-00049.safetensors b/model-00024-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..be2ac9c551177dcb07bd9f8a1741137d5189bd4c
--- /dev/null
+++ b/model-00024-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54a2c9ce6c85f673c86f2a6b11b61172ca5daaebf6db3a4d0dc10bdd2466931a
+size 1246284504
diff --git a/model-00025-of-00049.safetensors b/model-00025-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9a23af2bc0d6e09377487007e8805ab8552fcf65
--- /dev/null
+++ b/model-00025-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49e286ee88f44373a255d66f5e520e99ecd6a19849df281f84a30e0e2d986932
+size 1246284504
diff --git a/model-00026-of-00049.safetensors b/model-00026-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..276a9fdebddb44759d61812f948d435945648e0a
--- /dev/null
+++ b/model-00026-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1609d888bda589cb6e67ecd43c059c28992ea3d381916c0d8b7487e2c9ec857
+size 1246284504
diff --git a/model-00027-of-00049.safetensors b/model-00027-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9c1be1ddd393dff66633ad9f7cf0eca5293269ed
--- /dev/null
+++ b/model-00027-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da47d5a05d7f61b7d8444f2a32a1652fa28e1dbc81f6354142b38eaaee5743d9
+size 1246284504
diff --git a/model-00028-of-00049.safetensors b/model-00028-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8e8ab6f377accb45e32f1c8aa8dc621f330e59c8
--- /dev/null
+++ b/model-00028-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd8f75676b3f602402d2097d17a8eace621ffd22b377eae9f145601cfdb34f0c
+size 1246284504
diff --git a/model-00029-of-00049.safetensors b/model-00029-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e9ee36261cef110af27c20f01d1a3339436decbb
--- /dev/null
+++ b/model-00029-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13dd955c39a112ed5c35a490d8e3401d9035a2ee1a125c58d84f0aaad4263d3d
+size 1246284504
diff --git a/model-00030-of-00049.safetensors b/model-00030-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9c4bfa53d3535d68185d63a7cbc4069d587742af
--- /dev/null
+++ b/model-00030-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7bbc0916666b923a459f3fb56b6aab8149514a4ca76d450bf535a17f2d7cfd8c
+size 1246284504
diff --git a/model-00031-of-00049.safetensors b/model-00031-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4c899508cb2d347fda9e5fa56200dd409e1a98c0
--- /dev/null
+++ b/model-00031-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8604df2469948ea906fb59457b83d951f5741f2f240a668060537256f3315265
+size 1246284504
diff --git a/model-00032-of-00049.safetensors b/model-00032-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e87473021d4110c77c4de237491444582a37b8ef
--- /dev/null
+++ b/model-00032-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82302a2d64f8b75153c50726f0607bec8843de4f99cd7832056a83218c27f4a4
+size 1246284504
diff --git a/model-00033-of-00049.safetensors b/model-00033-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..741c9659dae182bcda37f8d9c60873d04498cd4a
--- /dev/null
+++ b/model-00033-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b42d414b4c76150b1323c7c4e75602e858eeb5dce4e14ca3ddbb86da1dcad01d
+size 1246284504
diff --git a/model-00034-of-00049.safetensors b/model-00034-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2b636b2fae31497de4d05cd856929f5420ebed96
--- /dev/null
+++ b/model-00034-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6174a45b75212900ea35f807a0081b434fe4af445c361a9e949790b7b62b7e9
+size 1246284504
diff --git a/model-00035-of-00049.safetensors b/model-00035-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9c7a8f2af69564a37be22f85076fff2c3dcb862a
--- /dev/null
+++ b/model-00035-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccbd5bb133aa6cb606e7f0554dbdde1e1445749b796dbe72d86778c41fa0df62
+size 1246284504
diff --git a/model-00036-of-00049.safetensors b/model-00036-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1bb14e6742b300bca4f5afc7785fa4c1ca7e06f2
--- /dev/null
+++ b/model-00036-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a07c475e1b1853850cb0c1d6684907b42e53462e605d5c21fb3b7fe676823949
+size 1246284504
diff --git a/model-00037-of-00049.safetensors b/model-00037-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c7f3cabccaca9591d81371beaed1dad589fe4f67
--- /dev/null
+++ b/model-00037-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e611968a88df3890540a813c84d6360b7f0ed54e6f234505c4dce97492f3e96c
+size 1246284504
diff --git a/model-00038-of-00049.safetensors b/model-00038-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..16adbfa061cec1334a21f1590081631caca5d244
--- /dev/null
+++ b/model-00038-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4f10178056c7ea33fc6e317f3c11575db671676ca5774fbed566e32b15da995b
+size 1246284504
diff --git a/model-00039-of-00049.safetensors b/model-00039-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ea9d9684bd0b6cd6529c52828a6a371fbe1a461c
--- /dev/null
+++ b/model-00039-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4297bb7a9e3d768c7f0d449502c1e2b342ffe75ed2e28471b0106ae7f5473258
+size 1246284504
diff --git a/model-00040-of-00049.safetensors b/model-00040-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e1da9450ba965a6aaeecd71cdd16065e164f017a
--- /dev/null
+++ b/model-00040-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4f8ea1e306c0c1308fadeab713092a6881af833d7a0f978297e3909e2d6966bf
+size 1246284504
diff --git a/model-00041-of-00049.safetensors b/model-00041-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9b8b7068009f0a292e2b867fa775919bfd6be80d
--- /dev/null
+++ b/model-00041-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf6c810eca3813de45d3b2715c4952e262a8318891597552c4ef5cba90131b18
+size 1246284504
diff --git a/model-00042-of-00049.safetensors b/model-00042-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b7e268c064ebc28f704e0f65d358cf7f086d3aca
--- /dev/null
+++ b/model-00042-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21485ff6e878251a2159e261bb37093b90d404d173fdefba52be74f2fb468e69
+size 1246284504
diff --git a/model-00043-of-00049.safetensors b/model-00043-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d6f577d6f15f28c5459d66d2c81378a359d914e8
--- /dev/null
+++ b/model-00043-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4841b1ca102234eeb50c77dcf2c2f31fa0af0c72e596c478ca48b61107ba138
+size 1246284504
diff --git a/model-00044-of-00049.safetensors b/model-00044-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..95edaf9db845c4fc57678b962bca0cb67ddf8aec
--- /dev/null
+++ b/model-00044-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:46c4a8fdd6dcee2f1fc462e9c99d904461d6aa42b3f2b02636e416fcd5407e97
+size 1246284504
diff --git a/model-00045-of-00049.safetensors b/model-00045-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8cf45e93285958474f50278f16a4f2a2de2aa48c
--- /dev/null
+++ b/model-00045-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc31f8f4a8f11fa116ac8b741c9563b42986de1b7d13e02bf47a68714a9a9d
+size 1246284504
diff --git a/model-00046-of-00049.safetensors b/model-00046-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..463a95d31551d9846536384912e5570a731a16f9
--- /dev/null
+++ b/model-00046-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64377f4c8be8a5e30e3c12350640492fed304a6950b3d1ab10dda755a0d1440c
+size 1246284504
diff --git a/model-00047-of-00049.safetensors b/model-00047-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..78ed7f18271e9b1b8f1fb86cf01f8dee7732ea18
--- /dev/null
+++ b/model-00047-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c0ce67bd1cd80f3f26c5d3134971080aa0b5359addfc4c053f753e5077a31f6
+size 1246284504
diff --git a/model-00048-of-00049.safetensors b/model-00048-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..64d27ea51a6dd64bd69d449b9868475589b666f5
--- /dev/null
+++ b/model-00048-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50dc6b0cd0eb1d037f514f045f40ae419c941658a2813e9ea62057a3e1561c92
+size 1246284504
diff --git a/model-00049-of-00049.safetensors b/model-00049-of-00049.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4a6e18e732c0319da621797721cf0ad06c733435
--- /dev/null
+++ b/model-00049-of-00049.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca6cbbf90b6b4b5da187a94fb91d7f1b098490c95ab1d1b67651c2255b251c1f
+size 843615384
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..4b9b778d42012425c5ba59e49a006351d34af120
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,18738 @@
+{
+ "metadata": {
+ "total_parameters": 30484303872,
+ "total_size": 60968607744
+ },
+ "weight_map": {
+ "model.embed_tokens.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.input_layernorm.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.mlp.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.mlp.up_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.input_layernorm.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.0.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.0.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.0.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.1.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.1.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.1.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.10.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.10.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.10.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.100.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.100.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.100.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.101.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.101.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.101.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.102.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.102.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.102.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.103.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.103.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.103.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.104.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.104.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.104.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.105.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.105.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.105.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.106.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.106.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.106.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.107.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.107.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.107.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.108.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.108.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.108.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.109.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.109.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.109.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.11.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.11.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.11.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.110.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.110.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.110.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.111.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.111.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.111.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.112.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.112.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.112.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.113.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.113.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.113.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.114.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.114.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.114.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.115.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.115.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.115.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.116.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.116.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.116.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.117.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.117.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.117.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.118.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.118.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.118.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.119.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.119.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.119.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.12.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.12.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.12.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.120.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.120.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.120.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.121.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.121.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.121.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.122.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.122.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.122.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.123.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.123.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.123.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.124.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.124.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.124.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.125.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.125.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.125.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.126.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.126.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.126.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.127.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.127.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.127.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.13.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.13.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.13.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.14.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.14.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.14.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.15.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.15.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.15.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.16.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.16.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.16.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.17.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.17.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.17.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.18.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.18.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.18.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.19.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.19.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.19.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.2.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.2.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.2.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.20.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.20.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.20.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.21.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.21.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.21.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.22.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.22.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.22.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.23.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.23.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.23.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.24.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.24.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.24.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.25.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.25.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.25.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.26.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.26.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.26.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.27.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.27.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.27.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.28.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.28.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.28.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.29.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.29.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.29.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.3.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.3.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.3.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.30.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.30.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.30.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.31.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.31.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.31.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.32.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.32.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.32.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.33.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.33.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.33.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.34.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.34.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.34.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.35.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.35.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.35.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.36.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.36.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.36.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.37.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.37.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.37.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.38.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.38.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.38.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.39.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.39.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.39.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.4.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.4.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.4.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.40.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.40.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.40.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.41.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.41.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.41.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.42.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.42.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.42.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.43.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.43.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.43.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.44.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.44.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.44.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.45.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.45.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.45.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.46.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.46.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.46.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.47.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.47.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.47.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.48.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.48.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.48.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.49.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.49.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.49.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.5.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.5.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.5.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.50.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.50.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.50.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.51.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.51.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.51.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.52.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.52.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.52.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.53.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.53.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.53.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.54.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.54.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.54.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.55.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.55.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.55.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.56.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.56.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.56.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.57.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.57.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.57.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.58.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.58.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.58.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.59.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.59.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.59.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.6.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.6.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.6.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.60.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.60.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.60.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.61.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.61.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.61.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.62.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.62.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.62.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.63.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.63.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.63.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.64.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.64.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.64.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.65.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.65.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.65.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.66.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.66.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.66.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.67.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.67.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.67.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.68.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.68.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.68.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.69.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.69.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.69.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.7.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.7.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.7.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.70.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.70.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.70.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.71.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.71.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.71.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.72.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.72.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.72.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.73.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.73.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.73.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.74.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.74.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.74.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.75.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.75.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.75.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.76.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.76.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.76.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.77.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.77.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.77.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.78.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.78.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.78.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.79.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.79.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.79.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.8.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.8.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.8.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.80.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.80.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.80.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.81.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.81.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.81.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.82.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.82.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.82.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.83.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.83.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.83.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.84.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.84.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.84.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.85.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.85.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.85.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.86.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.86.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.86.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.87.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.87.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.87.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.88.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.88.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.88.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.89.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.89.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.89.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.9.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.9.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.9.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.90.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.90.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.90.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.91.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.91.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.91.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.92.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.92.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.92.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.93.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.93.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.93.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.94.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.94.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.94.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.95.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.95.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.95.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.96.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.96.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.96.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.97.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.97.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.97.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.98.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.98.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.98.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.99.down_proj.weight": "model-00001-of-00049.safetensors",
+ "model.layers.1.mlp.experts.99.gate_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.experts.99.up_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.mlp.gate.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.10.input_layernorm.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.0.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.0.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.1.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.1.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.10.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.10.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.100.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.101.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.102.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.103.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.104.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.105.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.105.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.106.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.107.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.108.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.109.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.109.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.11.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.11.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.110.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.111.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.112.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.113.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.114.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.115.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.116.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.117.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.118.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.119.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.12.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.12.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.120.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.121.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.122.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.123.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.124.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.125.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.126.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.127.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.13.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.13.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.14.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.14.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.15.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.15.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.16.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.16.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.17.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.17.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.18.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.18.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.19.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.19.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.2.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.2.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.20.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.20.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.21.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.21.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.22.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.22.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.23.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.23.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.24.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.24.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.25.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.25.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.26.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.26.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.27.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.27.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.28.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.28.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.29.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.29.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.3.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.3.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.30.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.30.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.31.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.31.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.32.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.32.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.33.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.33.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.34.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.34.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.35.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.35.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.36.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.36.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.37.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.37.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.38.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.38.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.39.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.39.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.4.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.4.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.40.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.40.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.41.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.41.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.42.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.42.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.43.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.43.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.44.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.44.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.45.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.45.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.46.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.46.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.47.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.47.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.48.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.48.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.49.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.49.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.5.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.5.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.50.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.50.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.51.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.51.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.52.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.52.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.53.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.53.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.54.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.54.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.55.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.55.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.56.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.56.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.57.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.57.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.58.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.58.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.59.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.59.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.6.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.6.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.60.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.60.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.61.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.61.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.62.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.62.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.63.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.63.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.64.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.64.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.65.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.65.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.66.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.66.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.67.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.67.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.68.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.68.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.69.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.69.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.7.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.7.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.70.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.71.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.72.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.73.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.74.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.75.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.76.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.77.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.78.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.79.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.8.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.8.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.80.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.81.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.82.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.83.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.84.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.85.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.86.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.87.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.88.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.89.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.9.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.9.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.90.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.91.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.92.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.93.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.94.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.95.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.96.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.97.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.98.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.99.down_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.experts.99.up_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.mlp.gate.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.self_attn.k_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.self_attn.o_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.self_attn.q_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.10.self_attn.v_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.input_layernorm.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.0.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.1.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.10.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.100.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.101.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.102.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.103.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.104.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.105.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.106.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.107.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.108.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.109.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.11.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.110.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.111.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.112.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.113.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.113.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.114.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.115.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.116.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.117.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.118.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.119.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.12.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.120.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.121.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.122.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.123.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.124.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.125.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.126.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.127.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.13.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.14.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.15.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.16.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.17.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.18.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.19.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.2.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.20.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.21.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.22.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.23.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.24.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.25.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.25.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.26.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.27.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.28.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.29.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.3.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.30.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.31.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.32.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.33.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.34.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.35.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.36.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.37.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.38.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.39.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.4.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.40.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.41.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.41.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.42.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.43.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.44.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.45.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.46.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.47.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.48.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.49.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.5.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.50.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.51.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.51.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.52.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.53.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.54.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.55.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.56.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.57.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.58.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.59.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.6.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.6.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.60.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.61.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.62.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.63.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.64.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.65.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.66.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.67.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.68.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.69.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.7.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.70.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.71.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.72.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.73.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.74.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.74.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.75.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.76.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.77.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.78.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.79.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.8.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.80.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.81.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.82.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.83.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.84.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.85.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.86.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.87.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.88.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.89.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.9.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.90.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.90.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.91.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.92.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.93.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.94.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.95.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.96.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.96.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.97.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.98.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.99.down_proj.weight": "model-00011-of-00049.safetensors",
+ "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.mlp.gate.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.self_attn.k_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.self_attn.o_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.self_attn.q_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.11.self_attn.v_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.input_layernorm.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.0.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.1.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.10.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.100.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.100.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.101.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.101.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.102.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.102.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.103.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.103.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.104.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.104.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.105.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.105.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.106.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.106.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.107.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.107.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.108.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.108.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.109.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.109.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.11.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.110.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.110.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.111.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.111.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.112.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.112.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.113.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.113.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.114.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.114.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.115.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.115.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.116.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.116.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.117.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.117.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.118.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.118.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.119.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.119.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.12.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.120.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.120.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.121.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.121.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.122.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.122.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.123.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.123.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.124.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.124.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.125.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.125.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.126.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.126.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.127.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.127.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.13.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.14.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.15.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.16.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.17.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.18.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.19.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.2.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.20.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.21.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.22.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.23.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.23.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.24.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.25.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.26.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.27.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.28.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.29.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.3.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.30.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.31.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.32.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.33.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.34.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.35.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.36.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.37.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.38.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.39.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.4.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.4.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.40.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.40.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.41.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.42.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.43.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.44.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.45.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.46.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.47.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.48.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.49.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.5.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.50.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.51.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.52.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.53.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.54.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.55.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.56.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.57.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.58.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.59.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.6.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.60.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.61.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.62.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.63.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.64.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.65.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.66.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.67.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.68.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.69.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.7.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.70.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.71.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.72.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.73.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.74.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.75.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.76.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.77.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.78.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.79.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.79.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.8.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.80.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.81.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.82.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.83.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.84.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.85.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.85.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.86.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.87.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.88.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.89.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.9.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.90.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.91.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.92.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.93.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.94.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.95.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.95.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.96.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.96.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.97.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.97.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.98.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.98.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.99.down_proj.weight": "model-00012-of-00049.safetensors",
+ "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.experts.99.up_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.mlp.gate.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.self_attn.k_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.self_attn.q_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.12.self_attn.v_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.input_layernorm.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.0.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.1.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.10.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.100.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.100.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.101.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.101.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.102.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.102.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.103.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.103.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.104.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.104.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.105.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.105.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.106.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.106.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.107.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.107.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.108.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.108.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.109.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.109.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.11.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.11.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.110.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.110.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.111.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.111.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.112.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.112.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.113.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.113.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.114.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.114.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.115.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.115.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.116.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.116.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.117.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.117.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.118.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.118.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.119.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.119.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.12.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.120.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.120.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.121.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.121.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.122.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.122.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.123.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.123.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.124.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.124.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.125.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.125.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.126.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.126.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.127.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.127.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.13.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.14.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.15.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.16.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.17.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.18.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.19.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.2.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.20.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.21.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.22.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.23.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.24.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.24.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.25.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.25.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.26.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.26.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.27.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.27.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.28.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.28.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.29.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.29.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.3.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.30.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.30.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.31.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.31.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.32.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.32.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.33.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.33.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.34.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.34.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.35.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.35.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.36.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.36.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.37.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.37.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.38.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.38.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.39.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.39.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.4.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.40.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.40.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.41.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.41.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.42.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.42.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.43.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.43.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.44.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.44.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.45.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.45.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.46.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.46.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.47.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.47.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.48.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.48.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.49.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.49.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.5.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.50.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.50.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.51.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.51.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.52.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.52.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.53.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.53.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.54.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.54.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.55.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.55.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.56.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.56.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.57.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.57.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.58.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.58.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.59.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.59.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.6.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.60.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.60.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.61.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.61.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.62.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.62.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.63.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.63.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.64.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.64.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.65.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.65.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.66.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.66.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.67.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.67.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.68.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.68.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.69.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.69.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.7.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.70.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.70.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.71.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.71.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.72.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.72.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.73.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.73.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.74.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.74.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.75.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.75.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.76.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.76.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.77.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.77.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.78.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.78.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.79.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.79.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.8.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.8.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.80.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.80.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.81.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.81.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.82.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.82.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.83.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.83.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.84.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.84.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.85.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.85.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.86.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.86.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.87.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.87.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.88.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.88.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.89.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.89.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.9.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.90.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.90.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.91.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.91.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.92.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.92.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.93.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.93.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.94.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.94.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.95.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.95.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.96.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.96.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.97.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.97.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.98.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.98.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.99.down_proj.weight": "model-00013-of-00049.safetensors",
+ "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.experts.99.up_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.mlp.gate.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.self_attn.k_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.self_attn.o_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.self_attn.q_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.13.self_attn.v_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.input_layernorm.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.0.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.0.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.1.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.1.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.10.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.10.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.100.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.100.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.101.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.101.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.102.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.102.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.103.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.103.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.104.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.104.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.105.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.105.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.106.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.106.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.107.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.107.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.108.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.108.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.109.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.109.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.11.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.11.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.110.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.110.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.111.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.111.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.112.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.112.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.113.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.113.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.114.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.114.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.115.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.115.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.116.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.116.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.117.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.117.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.118.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.118.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.119.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.119.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.12.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.12.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.120.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.120.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.121.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.121.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.122.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.122.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.123.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.123.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.124.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.124.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.125.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.125.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.126.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.126.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.127.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.127.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.13.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.13.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.14.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.14.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.15.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.15.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.16.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.16.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.17.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.17.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.18.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.18.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.19.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.19.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.2.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.2.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.20.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.20.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.21.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.21.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.22.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.22.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.23.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.23.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.24.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.24.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.25.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.25.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.26.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.26.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.27.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.27.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.28.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.28.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.29.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.29.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.3.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.3.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.30.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.30.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.31.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.31.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.32.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.32.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.33.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.33.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.34.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.34.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.35.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.35.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.36.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.36.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.37.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.37.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.38.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.38.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.39.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.39.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.4.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.4.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.40.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.40.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.41.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.41.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.42.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.42.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.43.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.43.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.44.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.44.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.45.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.45.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.46.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.46.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.47.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.47.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.48.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.48.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.49.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.49.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.5.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.5.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.50.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.50.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.51.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.51.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.52.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.52.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.53.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.53.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.54.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.54.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.55.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.55.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.56.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.56.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.57.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.57.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.58.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.58.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.59.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.59.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.6.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.6.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.60.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.60.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.61.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.61.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.62.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.62.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.63.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.63.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.64.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.64.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.65.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.65.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.66.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.66.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.67.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.67.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.68.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.68.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.69.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.69.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.7.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.7.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.70.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.70.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.71.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.71.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.72.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.72.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.73.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.73.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.74.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.74.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.75.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.75.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.76.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.76.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.77.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.77.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.78.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.78.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.79.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.79.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.8.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.8.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.80.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.80.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.81.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.81.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.82.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.82.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.83.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.83.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.84.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.84.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.85.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.85.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.86.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.86.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.87.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.87.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.88.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.88.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.89.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.89.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.9.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.9.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.90.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.90.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.91.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.91.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.92.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.92.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.93.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.93.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.94.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.94.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.95.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.95.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.96.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.96.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.97.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.97.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.98.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.98.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.99.down_proj.weight": "model-00014-of-00049.safetensors",
+ "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.experts.99.up_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.mlp.gate.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.self_attn.k_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.self_attn.o_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.self_attn.q_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.14.self_attn.v_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.input_layernorm.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.0.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.0.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.1.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.1.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.10.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.10.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.100.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.100.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.101.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.101.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.102.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.102.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.103.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.103.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.104.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.104.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.105.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.105.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.106.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.106.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.107.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.107.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.108.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.108.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.109.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.109.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.11.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.11.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.110.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.110.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.111.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.111.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.112.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.112.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.113.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.113.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.114.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.114.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.115.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.115.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.116.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.116.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.117.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.117.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.118.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.118.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.119.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.119.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.12.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.12.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.120.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.120.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.121.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.121.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.122.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.122.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.123.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.123.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.124.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.124.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.125.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.125.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.126.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.126.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.127.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.127.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.13.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.13.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.14.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.14.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.15.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.15.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.16.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.16.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.17.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.17.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.18.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.18.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.19.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.19.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.2.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.2.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.20.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.20.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.21.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.21.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.22.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.22.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.23.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.23.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.24.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.24.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.25.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.25.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.26.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.26.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.27.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.27.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.28.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.28.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.29.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.29.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.3.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.3.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.30.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.30.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.31.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.31.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.32.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.32.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.33.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.33.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.34.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.34.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.35.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.35.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.36.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.36.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.37.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.37.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.38.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.38.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.39.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.39.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.4.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.4.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.40.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.40.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.41.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.41.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.42.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.42.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.43.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.43.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.44.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.44.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.45.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.45.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.46.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.46.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.47.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.47.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.48.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.48.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.49.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.49.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.5.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.5.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.50.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.50.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.51.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.51.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.52.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.52.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.53.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.53.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.54.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.54.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.55.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.55.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.56.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.56.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.57.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.57.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.58.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.58.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.59.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.59.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.6.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.6.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.60.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.60.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.61.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.61.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.62.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.62.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.63.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.63.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.64.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.64.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.65.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.65.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.66.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.66.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.67.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.67.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.68.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.68.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.69.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.69.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.7.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.7.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.70.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.70.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.71.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.71.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.72.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.72.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.73.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.73.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.74.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.74.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.75.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.75.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.76.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.76.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.77.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.77.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.78.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.78.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.79.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.79.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.8.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.8.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.80.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.80.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.81.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.81.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.82.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.82.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.83.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.83.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.84.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.84.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.85.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.85.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.86.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.86.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.87.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.87.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.88.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.88.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.89.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.89.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.9.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.9.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.90.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.90.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.91.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.91.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.92.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.92.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.93.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.93.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.94.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.94.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.95.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.95.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.96.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.96.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.97.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.97.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.98.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.98.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.99.down_proj.weight": "model-00015-of-00049.safetensors",
+ "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.experts.99.up_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.mlp.gate.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.self_attn.k_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.self_attn.o_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.self_attn.q_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.15.self_attn.v_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.input_layernorm.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.0.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.0.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.1.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.1.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.10.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.10.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.100.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.100.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.101.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.101.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.102.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.102.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.103.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.103.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.104.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.104.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.105.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.105.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.106.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.106.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.107.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.107.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.108.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.108.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.109.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.109.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.11.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.11.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.110.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.110.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.111.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.111.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.112.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.112.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.113.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.113.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.114.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.114.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.115.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.115.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.116.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.116.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.117.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.117.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.118.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.118.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.119.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.119.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.12.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.12.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.120.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.120.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.121.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.121.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.122.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.122.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.123.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.123.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.124.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.124.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.125.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.125.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.126.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.126.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.127.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.127.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.13.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.13.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.14.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.14.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.15.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.15.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.16.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.16.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.17.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.17.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.18.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.18.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.19.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.19.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.2.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.2.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.20.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.20.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.21.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.21.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.22.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.22.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.23.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.23.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.24.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.24.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.25.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.25.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.26.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.26.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.27.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.27.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.28.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.28.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.29.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.29.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.3.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.3.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.30.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.30.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.31.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.31.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.32.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.32.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.33.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.33.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.34.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.34.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.35.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.35.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.36.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.36.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.37.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.37.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.38.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.38.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.39.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.39.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.4.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.4.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.40.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.40.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.41.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.41.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.42.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.42.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.43.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.43.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.44.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.44.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.45.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.45.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.46.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.46.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.47.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.47.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.48.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.48.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.49.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.49.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.5.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.5.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.50.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.50.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.51.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.51.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.52.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.52.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.53.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.53.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.54.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.54.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.55.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.55.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.56.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.56.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.57.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.57.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.58.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.58.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.59.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.59.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.6.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.6.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.60.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.60.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.61.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.61.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.62.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.62.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.63.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.63.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.64.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.64.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.65.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.65.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.66.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.66.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.67.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.67.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.68.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.68.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.69.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.69.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.7.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.7.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.70.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.70.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.71.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.71.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.72.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.72.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.73.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.73.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.74.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.74.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.75.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.75.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.76.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.76.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.77.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.77.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.78.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.78.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.79.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.79.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.8.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.8.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.80.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.80.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.81.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.81.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.82.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.82.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.83.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.83.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.84.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.84.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.85.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.85.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.86.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.86.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.87.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.87.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.88.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.88.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.89.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.89.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.9.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.9.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.90.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.90.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.91.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.91.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.92.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.92.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.93.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.93.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.94.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.94.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.95.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.95.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.96.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.96.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.97.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.97.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.98.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.98.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.99.down_proj.weight": "model-00016-of-00049.safetensors",
+ "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.experts.99.up_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.mlp.gate.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.self_attn.k_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.self_attn.o_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.self_attn.q_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.16.self_attn.v_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.input_layernorm.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.0.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.0.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.1.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.1.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.10.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.10.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.100.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.100.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.101.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.101.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.102.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.102.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.103.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.103.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.104.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.104.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.105.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.105.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.106.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.106.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.107.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.107.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.108.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.108.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.109.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.109.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.11.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.11.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.110.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.110.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.111.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.111.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.112.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.112.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.113.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.113.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.114.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.114.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.115.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.115.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.116.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.116.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.117.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.117.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.118.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.118.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.119.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.119.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.12.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.12.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.120.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.120.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.121.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.121.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.122.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.122.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.123.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.123.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.124.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.124.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.125.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.125.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.126.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.126.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.127.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.127.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.13.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.13.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.14.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.14.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.15.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.15.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.16.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.16.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.17.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.17.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.18.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.18.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.19.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.19.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.2.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.2.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.20.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.20.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.21.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.21.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.22.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.22.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.23.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.23.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.24.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.24.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.25.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.25.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.26.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.26.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.27.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.27.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.28.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.28.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.29.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.29.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.3.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.3.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.30.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.30.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.31.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.31.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.32.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.32.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.33.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.33.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.34.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.34.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.35.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.35.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.36.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.36.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.37.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.37.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.38.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.38.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.39.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.39.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.4.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.4.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.40.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.40.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.41.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.41.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.42.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.42.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.43.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.43.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.44.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.44.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.45.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.45.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.46.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.46.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.47.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.47.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.48.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.48.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.49.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.49.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.5.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.5.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.50.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.50.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.51.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.51.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.52.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.52.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.53.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.53.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.54.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.54.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.55.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.55.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.56.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.56.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.57.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.57.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.58.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.58.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.59.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.59.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.6.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.6.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.60.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.60.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.61.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.61.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.62.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.62.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.63.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.63.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.64.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.64.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.65.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.65.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.66.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.66.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.67.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.67.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.68.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.68.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.69.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.69.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.7.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.7.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.70.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.70.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.71.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.71.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.72.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.72.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.73.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.73.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.74.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.74.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.75.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.75.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.76.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.76.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.77.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.77.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.78.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.78.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.79.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.79.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.8.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.8.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.80.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.80.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.81.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.81.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.82.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.82.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.83.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.83.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.84.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.84.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.85.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.85.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.86.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.86.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.87.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.87.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.88.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.88.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.89.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.89.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.9.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.9.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.90.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.90.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.91.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.91.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.92.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.92.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.93.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.93.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.94.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.94.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.95.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.95.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.96.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.96.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.97.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.97.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.98.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.98.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.99.down_proj.weight": "model-00017-of-00049.safetensors",
+ "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.experts.99.up_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.mlp.gate.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.self_attn.k_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.self_attn.o_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.self_attn.q_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.17.self_attn.v_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.input_layernorm.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.0.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.0.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.1.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.1.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.10.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.10.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.100.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.100.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.101.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.101.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.102.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.102.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.103.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.103.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.104.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.104.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.105.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.105.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.106.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.106.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.107.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.107.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.108.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.108.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.109.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.109.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.11.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.11.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.110.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.110.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.111.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.111.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.112.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.112.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.113.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.113.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.114.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.114.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.115.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.115.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.116.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.116.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.117.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.117.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.118.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.118.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.119.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.119.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.12.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.12.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.120.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.120.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.121.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.121.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.122.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.122.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.123.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.123.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.124.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.124.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.125.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.125.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.126.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.126.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.127.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.127.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.13.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.13.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.14.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.14.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.15.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.15.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.16.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.16.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.17.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.17.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.18.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.18.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.19.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.19.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.2.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.2.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.20.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.20.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.21.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.21.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.22.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.22.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.23.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.23.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.24.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.24.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.25.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.25.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.26.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.26.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.27.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.27.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.28.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.28.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.29.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.29.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.3.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.3.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.30.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.30.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.31.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.31.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.32.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.32.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.33.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.33.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.34.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.34.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.35.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.35.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.36.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.36.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.37.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.37.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.38.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.38.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.39.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.39.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.4.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.4.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.40.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.40.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.41.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.41.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.42.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.42.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.43.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.43.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.44.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.44.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.45.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.45.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.46.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.46.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.47.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.47.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.48.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.48.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.49.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.49.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.5.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.5.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.50.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.50.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.51.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.51.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.52.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.52.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.53.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.53.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.54.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.54.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.55.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.55.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.56.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.56.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.57.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.57.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.58.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.58.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.59.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.59.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.6.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.6.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.60.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.60.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.61.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.61.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.62.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.62.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.63.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.63.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.64.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.64.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.65.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.65.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.66.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.66.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.67.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.67.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.68.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.68.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.69.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.69.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.7.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.7.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.70.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.70.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.71.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.71.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.72.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.72.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.73.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.73.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.74.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.74.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.75.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.75.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.76.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.76.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.77.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.77.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.78.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.78.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.79.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.79.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.8.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.8.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.80.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.80.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.81.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.81.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.82.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.82.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.83.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.83.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.84.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.84.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.85.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.85.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.86.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.86.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.87.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.87.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.88.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.88.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.89.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.89.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.9.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.9.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.90.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.90.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.91.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.91.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.92.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.92.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.93.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.93.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.94.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.94.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.95.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.95.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.96.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.96.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.97.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.97.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.98.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.98.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.99.down_proj.weight": "model-00018-of-00049.safetensors",
+ "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.experts.99.up_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.mlp.gate.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.self_attn.k_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.self_attn.o_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.self_attn.q_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.18.self_attn.v_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.input_layernorm.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.0.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.0.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.1.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.1.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.10.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.10.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.100.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.100.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.101.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.101.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.102.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.102.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.103.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.103.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.104.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.104.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.105.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.105.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.106.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.106.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.107.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.107.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.108.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.108.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.109.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.109.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.11.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.11.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.110.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.110.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.111.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.111.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.112.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.112.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.113.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.113.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.114.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.114.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.115.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.115.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.116.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.116.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.117.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.117.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.118.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.118.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.119.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.119.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.12.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.12.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.120.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.120.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.121.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.121.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.122.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.122.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.123.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.123.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.124.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.124.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.125.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.125.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.126.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.126.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.127.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.127.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.13.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.13.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.14.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.14.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.15.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.15.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.16.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.16.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.17.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.17.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.18.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.18.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.19.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.19.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.2.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.2.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.20.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.20.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.21.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.21.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.22.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.22.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.23.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.23.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.24.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.24.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.25.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.25.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.26.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.26.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.27.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.27.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.28.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.28.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.29.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.29.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.3.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.3.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.30.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.30.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.31.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.31.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.32.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.32.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.33.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.33.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.34.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.34.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.35.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.35.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.36.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.36.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.37.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.37.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.38.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.38.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.39.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.39.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.4.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.4.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.40.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.40.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.41.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.41.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.42.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.42.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.43.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.43.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.44.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.44.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.45.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.45.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.46.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.46.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.47.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.47.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.48.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.48.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.49.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.49.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.5.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.5.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.50.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.50.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.51.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.51.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.52.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.52.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.53.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.53.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.54.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.54.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.55.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.55.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.56.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.56.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.57.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.57.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.58.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.58.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.59.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.59.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.6.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.6.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.60.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.60.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.61.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.61.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.62.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.62.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.63.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.63.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.64.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.64.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.65.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.65.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.66.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.66.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.67.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.67.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.68.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.68.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.69.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.69.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.7.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.7.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.70.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.70.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.71.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.71.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.72.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.72.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.73.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.73.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.74.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.74.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.75.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.75.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.76.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.76.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.77.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.77.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.78.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.78.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.79.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.79.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.8.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.8.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.80.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.80.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.81.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.81.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.82.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.82.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.83.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.83.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.84.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.84.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.85.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.85.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.86.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.86.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.87.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.87.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.88.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.88.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.89.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.89.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.9.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.9.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.90.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.90.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.91.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.91.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.92.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.92.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.93.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.93.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.94.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.94.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.95.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.95.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.96.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.96.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.97.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.97.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.98.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.98.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.99.down_proj.weight": "model-00019-of-00049.safetensors",
+ "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.experts.99.up_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.mlp.gate.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.self_attn.k_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.self_attn.o_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.self_attn.q_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.19.self_attn.v_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.2.input_layernorm.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.0.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.0.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.0.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.1.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.1.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.1.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.10.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.10.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.10.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.100.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.100.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.100.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.101.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.101.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.101.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.102.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.102.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.102.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.103.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.103.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.103.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.104.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.104.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.104.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.105.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.105.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.105.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.106.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.106.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.106.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.107.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.107.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.107.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.108.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.108.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.108.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.109.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.109.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.109.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.11.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.11.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.11.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.110.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.110.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.110.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.111.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.111.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.111.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.112.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.112.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.112.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.113.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.113.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.113.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.114.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.114.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.114.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.115.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.115.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.115.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.116.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.116.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.116.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.117.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.117.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.117.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.118.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.118.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.118.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.119.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.119.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.119.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.12.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.12.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.12.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.120.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.120.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.120.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.121.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.121.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.121.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.122.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.122.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.122.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.123.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.123.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.123.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.124.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.124.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.124.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.125.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.125.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.125.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.126.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.126.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.126.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.127.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.127.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.127.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.13.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.13.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.13.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.14.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.14.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.14.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.15.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.15.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.15.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.16.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.16.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.16.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.17.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.17.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.17.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.18.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.18.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.18.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.19.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.19.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.19.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.2.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.2.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.2.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.20.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.20.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.20.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.21.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.21.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.21.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.22.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.22.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.22.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.23.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.23.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.23.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.24.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.24.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.24.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.25.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.25.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.25.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.26.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.26.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.26.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.27.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.27.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.27.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.28.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.28.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.28.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.29.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.29.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.29.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.3.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.3.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.3.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.30.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.30.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.30.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.31.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.31.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.31.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.32.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.32.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.32.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.33.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.33.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.33.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.34.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.34.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.34.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.35.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.35.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.35.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.36.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.36.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.36.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.37.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.37.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.37.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.38.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.38.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.38.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.39.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.39.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.39.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.4.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.4.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.4.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.40.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.40.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.40.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.41.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.41.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.41.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.42.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.42.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.42.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.43.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.43.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.43.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.44.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.44.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.44.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.45.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.45.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.45.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.46.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.46.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.46.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.47.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.47.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.47.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.48.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.48.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.48.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.49.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.49.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.49.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.5.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.5.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.5.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.50.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.50.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.50.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.51.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.51.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.51.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.52.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.52.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.52.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.53.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.53.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.53.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.54.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.54.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.54.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.55.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.55.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.55.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.56.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.56.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.56.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.57.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.57.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.57.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.58.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.58.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.58.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.59.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.59.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.59.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.6.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.6.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.6.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.60.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.60.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.60.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.61.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.61.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.61.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.62.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.62.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.62.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.63.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.63.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.63.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.64.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.64.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.64.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.65.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.65.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.65.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.66.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.66.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.66.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.67.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.67.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.67.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.68.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.68.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.68.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.69.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.69.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.69.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.7.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.7.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.7.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.70.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.70.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.70.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.71.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.71.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.71.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.72.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.72.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.72.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.73.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.73.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.73.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.74.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.74.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.74.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.75.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.75.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.75.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.76.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.76.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.76.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.77.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.77.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.77.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.78.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.78.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.78.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.79.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.79.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.79.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.8.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.8.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.8.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.80.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.80.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.80.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.81.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.81.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.81.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.82.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.82.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.82.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.83.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.83.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.83.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.84.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.84.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.84.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.85.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.85.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.85.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.86.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.86.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.86.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.87.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.87.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.87.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.88.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.88.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.88.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.89.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.89.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.89.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.9.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.9.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.9.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.90.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.90.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.90.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.91.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.91.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.91.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.92.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.92.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.92.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.93.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.93.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.93.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.94.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.94.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.94.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.95.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.95.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.95.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.96.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.96.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.96.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.97.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.97.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.97.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.98.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.98.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.98.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.99.down_proj.weight": "model-00002-of-00049.safetensors",
+ "model.layers.2.mlp.experts.99.gate_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.experts.99.up_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.mlp.gate.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.self_attn.k_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.20.input_layernorm.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.0.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.0.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.1.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.1.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.10.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.10.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.100.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.100.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.101.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.101.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.102.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.102.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.103.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.103.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.104.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.104.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.105.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.105.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.106.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.106.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.107.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.107.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.108.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.108.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.109.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.109.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.11.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.11.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.110.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.110.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.111.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.111.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.112.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.112.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.113.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.113.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.114.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.114.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.115.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.115.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.116.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.116.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.117.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.117.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.118.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.118.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.119.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.119.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.12.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.12.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.120.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.120.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.121.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.121.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.122.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.122.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.123.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.123.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.124.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.124.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.125.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.125.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.126.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.126.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.127.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.127.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.13.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.13.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.14.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.14.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.15.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.15.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.16.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.16.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.17.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.17.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.18.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.18.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.19.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.19.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.2.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.2.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.20.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.20.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.21.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.21.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.22.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.22.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.23.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.23.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.24.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.24.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.25.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.25.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.26.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.26.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.27.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.27.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.28.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.28.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.29.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.29.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.3.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.3.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.30.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.30.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.31.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.31.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.32.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.32.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.33.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.33.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.34.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.34.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.35.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.35.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.36.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.36.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.37.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.37.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.38.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.38.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.39.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.39.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.4.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.4.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.40.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.40.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.41.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.41.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.42.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.42.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.43.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.43.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.44.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.44.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.45.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.45.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.46.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.46.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.47.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.47.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.48.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.48.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.49.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.49.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.5.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.5.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.50.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.50.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.51.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.51.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.52.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.52.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.53.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.53.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.54.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.54.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.55.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.55.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.56.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.56.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.57.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.57.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.58.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.58.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.59.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.59.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.6.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.6.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.60.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.60.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.61.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.61.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.62.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.62.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.63.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.63.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.64.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.64.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.65.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.65.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.66.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.66.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.67.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.67.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.68.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.68.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.69.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.69.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.7.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.7.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.70.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.70.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.71.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.71.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.72.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.72.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.73.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.73.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.74.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.74.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.75.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.75.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.76.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.76.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.77.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.77.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.78.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.78.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.79.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.79.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.8.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.8.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.80.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.80.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.81.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.81.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.82.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.82.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.83.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.83.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.84.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.84.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.85.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.85.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.86.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.86.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.87.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.87.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.88.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.88.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.89.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.89.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.9.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.9.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.90.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.90.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.91.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.91.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.92.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.92.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.93.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.93.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.94.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.94.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.95.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.95.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.96.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.96.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.97.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.97.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.98.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.98.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.99.down_proj.weight": "model-00020-of-00049.safetensors",
+ "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.experts.99.up_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.mlp.gate.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.self_attn.k_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.self_attn.o_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.self_attn.q_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.20.self_attn.v_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.input_layernorm.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.0.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.0.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.1.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.1.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.10.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.10.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.100.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.100.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.101.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.101.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.102.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.102.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.103.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.103.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.104.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.104.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.105.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.105.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.106.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.106.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.107.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.107.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.108.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.108.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.109.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.109.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.11.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.11.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.110.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.110.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.111.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.111.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.112.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.112.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.113.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.113.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.114.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.114.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.115.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.115.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.116.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.116.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.117.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.117.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.118.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.118.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.119.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.119.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.12.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.12.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.120.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.120.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.121.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.121.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.122.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.122.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.123.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.123.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.124.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.124.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.125.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.125.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.126.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.126.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.127.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.127.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.13.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.13.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.14.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.14.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.15.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.15.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.16.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.16.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.17.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.17.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.18.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.18.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.19.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.19.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.2.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.2.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.20.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.20.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.21.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.21.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.22.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.22.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.23.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.23.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.24.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.24.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.25.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.25.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.26.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.26.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.27.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.27.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.28.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.28.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.29.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.29.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.3.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.3.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.30.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.30.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.31.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.31.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.32.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.32.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.33.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.33.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.34.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.34.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.35.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.35.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.36.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.36.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.37.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.37.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.38.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.38.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.39.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.39.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.4.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.4.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.40.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.40.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.41.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.41.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.42.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.42.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.43.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.43.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.44.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.44.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.45.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.45.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.46.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.46.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.47.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.47.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.48.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.48.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.49.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.49.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.5.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.5.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.50.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.50.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.51.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.51.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.52.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.52.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.53.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.53.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.54.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.54.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.55.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.55.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.56.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.56.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.57.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.57.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.58.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.58.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.59.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.59.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.6.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.6.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.60.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.60.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.61.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.61.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.62.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.62.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.63.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.63.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.64.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.64.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.65.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.65.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.66.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.66.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.67.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.67.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.68.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.68.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.69.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.69.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.7.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.7.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.70.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.70.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.71.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.71.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.72.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.72.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.73.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.73.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.74.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.74.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.75.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.75.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.76.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.76.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.77.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.77.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.78.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.78.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.79.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.79.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.8.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.8.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.80.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.80.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.81.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.81.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.82.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.82.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.83.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.83.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.84.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.84.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.85.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.85.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.86.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.86.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.87.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.87.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.88.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.88.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.89.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.89.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.9.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.9.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.90.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.90.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.91.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.91.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.92.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.92.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.93.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.93.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.94.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.94.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.95.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.95.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.96.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.96.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.97.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.97.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.98.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.98.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.99.down_proj.weight": "model-00021-of-00049.safetensors",
+ "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.experts.99.up_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.mlp.gate.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.self_attn.k_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.self_attn.o_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.self_attn.q_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.21.self_attn.v_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.input_layernorm.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.0.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.0.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.1.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.1.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.10.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.10.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.100.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.100.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.101.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.101.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.102.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.102.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.103.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.103.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.104.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.104.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.105.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.105.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.106.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.106.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.107.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.107.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.108.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.108.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.109.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.109.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.11.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.11.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.110.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.110.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.111.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.111.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.112.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.112.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.113.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.113.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.114.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.114.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.115.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.115.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.116.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.116.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.117.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.117.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.118.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.118.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.119.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.119.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.12.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.12.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.120.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.120.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.121.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.121.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.122.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.122.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.123.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.123.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.124.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.124.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.125.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.125.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.126.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.126.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.127.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.127.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.13.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.13.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.14.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.14.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.15.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.15.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.16.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.16.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.17.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.17.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.18.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.18.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.19.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.19.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.2.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.2.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.20.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.20.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.21.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.21.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.22.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.22.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.23.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.23.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.24.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.24.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.25.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.25.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.26.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.26.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.27.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.27.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.28.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.28.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.29.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.29.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.3.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.3.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.30.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.30.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.31.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.31.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.32.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.32.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.33.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.33.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.34.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.34.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.35.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.35.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.36.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.36.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.37.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.37.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.38.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.38.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.39.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.39.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.4.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.4.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.40.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.40.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.41.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.41.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.42.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.42.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.43.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.43.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.44.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.44.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.45.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.45.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.46.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.46.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.47.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.47.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.48.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.48.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.49.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.49.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.5.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.5.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.50.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.50.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.51.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.51.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.52.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.52.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.53.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.53.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.54.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.54.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.55.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.55.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.56.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.56.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.57.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.57.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.58.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.58.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.59.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.59.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.6.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.6.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.60.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.60.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.61.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.61.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.62.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.62.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.63.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.63.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.64.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.64.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.65.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.65.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.66.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.66.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.67.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.67.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.68.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.68.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.69.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.69.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.7.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.7.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.70.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.70.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.71.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.71.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.72.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.72.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.73.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.73.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.74.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.74.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.75.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.75.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.76.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.76.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.77.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.77.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.78.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.78.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.79.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.79.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.8.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.8.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.80.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.80.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.81.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.81.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.82.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.82.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.83.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.83.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.84.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.84.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.85.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.85.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.86.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.86.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.87.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.87.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.88.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.88.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.89.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.89.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.9.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.9.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.90.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.90.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.91.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.91.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.92.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.92.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.93.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.93.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.94.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.94.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.95.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.95.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.96.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.96.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.97.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.97.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.98.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.98.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.99.down_proj.weight": "model-00022-of-00049.safetensors",
+ "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.experts.99.up_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.mlp.gate.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.self_attn.k_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.self_attn.o_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.self_attn.q_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.22.self_attn.v_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.input_layernorm.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.0.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.0.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.1.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.1.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.10.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.10.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.100.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.100.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.101.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.101.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.102.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.102.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.103.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.103.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.104.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.104.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.105.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.105.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.106.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.106.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.107.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.107.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.108.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.108.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.109.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.109.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.11.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.11.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.110.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.110.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.111.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.111.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.112.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.112.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.113.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.113.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.114.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.114.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.115.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.115.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.116.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.116.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.117.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.117.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.118.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.118.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.119.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.119.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.12.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.12.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.120.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.120.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.121.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.121.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.122.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.122.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.123.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.123.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.124.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.124.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.125.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.125.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.126.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.126.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.127.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.127.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.13.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.13.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.14.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.14.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.15.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.15.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.16.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.16.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.17.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.17.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.18.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.18.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.19.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.19.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.2.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.2.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.20.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.20.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.21.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.21.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.22.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.22.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.23.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.23.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.24.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.24.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.25.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.25.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.26.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.26.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.27.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.27.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.28.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.28.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.29.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.29.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.3.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.3.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.30.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.30.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.31.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.31.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.32.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.32.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.33.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.33.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.34.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.34.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.35.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.35.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.36.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.36.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.37.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.37.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.38.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.38.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.39.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.39.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.4.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.4.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.40.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.40.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.41.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.41.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.42.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.42.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.43.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.43.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.44.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.44.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.45.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.45.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.46.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.46.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.47.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.47.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.48.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.48.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.49.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.49.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.5.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.5.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.50.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.50.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.51.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.51.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.52.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.52.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.53.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.53.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.54.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.54.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.55.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.55.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.56.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.56.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.57.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.57.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.58.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.58.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.59.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.59.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.6.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.6.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.60.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.60.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.61.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.61.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.62.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.62.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.63.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.63.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.64.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.64.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.65.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.65.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.66.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.66.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.67.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.67.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.68.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.68.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.69.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.69.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.7.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.7.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.70.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.70.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.71.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.71.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.72.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.72.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.73.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.73.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.74.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.74.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.75.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.75.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.76.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.76.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.77.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.77.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.78.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.78.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.79.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.79.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.8.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.8.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.80.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.80.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.81.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.81.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.82.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.82.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.83.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.83.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.84.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.84.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.85.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.85.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.86.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.86.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.87.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.87.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.88.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.88.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.89.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.89.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.9.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.9.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.90.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.90.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.91.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.91.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.92.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.92.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.93.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.93.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.94.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.94.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.95.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.95.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.96.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.96.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.97.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.97.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.98.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.98.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.99.down_proj.weight": "model-00023-of-00049.safetensors",
+ "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.experts.99.up_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.mlp.gate.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.self_attn.k_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.self_attn.o_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.self_attn.q_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.23.self_attn.v_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.input_layernorm.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.0.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.0.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.1.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.1.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.10.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.10.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.100.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.100.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.101.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.101.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.102.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.102.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.103.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.103.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.104.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.104.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.105.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.105.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.106.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.106.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.107.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.107.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.108.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.108.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.109.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.109.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.11.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.11.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.110.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.110.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.111.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.111.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.112.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.112.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.113.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.113.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.114.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.114.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.115.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.115.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.116.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.116.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.117.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.117.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.118.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.118.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.119.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.119.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.12.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.12.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.120.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.120.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.121.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.121.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.122.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.122.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.123.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.123.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.124.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.124.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.125.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.125.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.126.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.126.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.127.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.127.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.13.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.13.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.14.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.14.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.15.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.15.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.16.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.16.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.17.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.17.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.18.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.18.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.19.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.19.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.2.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.2.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.20.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.20.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.21.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.21.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.22.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.22.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.23.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.23.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.24.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.24.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.25.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.25.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.26.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.26.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.27.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.27.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.28.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.28.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.29.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.29.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.3.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.3.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.30.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.30.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.31.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.31.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.32.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.32.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.33.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.33.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.34.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.34.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.35.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.35.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.36.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.36.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.37.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.37.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.38.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.38.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.39.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.39.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.4.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.4.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.40.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.40.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.41.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.41.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.42.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.42.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.43.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.43.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.44.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.44.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.45.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.45.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.46.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.46.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.47.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.47.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.48.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.48.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.49.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.49.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.5.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.5.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.50.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.50.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.51.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.51.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.52.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.52.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.53.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.53.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.54.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.54.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.55.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.55.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.56.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.56.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.57.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.57.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.58.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.58.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.59.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.59.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.6.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.6.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.60.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.60.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.61.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.61.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.62.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.62.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.63.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.63.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.64.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.64.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.65.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.65.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.66.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.66.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.67.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.67.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.68.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.68.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.69.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.69.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.7.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.7.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.70.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.70.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.71.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.71.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.72.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.72.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.73.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.73.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.74.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.74.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.75.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.75.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.76.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.76.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.77.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.77.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.78.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.78.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.79.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.79.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.8.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.8.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.80.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.80.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.81.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.81.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.82.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.82.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.83.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.83.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.84.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.84.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.85.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.85.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.86.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.86.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.87.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.87.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.88.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.88.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.89.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.89.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.9.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.9.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.90.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.90.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.91.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.91.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.92.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.92.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.93.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.93.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.94.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.94.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.95.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.95.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.96.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.96.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.97.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.97.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.98.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.98.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.99.down_proj.weight": "model-00024-of-00049.safetensors",
+ "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.experts.99.up_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.mlp.gate.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.self_attn.k_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.self_attn.o_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.self_attn.q_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.24.self_attn.v_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.input_layernorm.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.0.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.0.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.1.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.1.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.10.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.10.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.100.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.100.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.101.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.101.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.102.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.102.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.103.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.103.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.104.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.104.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.105.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.105.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.106.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.106.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.107.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.107.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.108.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.108.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.109.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.109.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.11.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.11.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.110.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.110.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.111.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.111.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.112.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.112.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.113.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.113.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.114.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.114.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.115.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.115.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.116.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.116.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.117.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.117.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.118.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.118.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.119.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.119.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.12.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.12.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.120.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.120.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.121.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.121.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.122.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.122.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.123.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.123.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.124.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.124.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.125.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.125.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.126.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.126.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.127.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.127.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.13.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.13.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.14.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.14.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.15.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.15.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.16.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.16.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.17.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.17.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.18.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.18.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.19.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.19.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.2.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.2.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.20.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.20.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.21.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.21.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.22.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.22.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.23.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.23.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.24.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.24.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.25.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.25.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.26.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.26.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.27.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.27.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.28.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.28.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.29.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.29.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.3.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.3.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.30.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.30.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.31.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.31.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.32.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.32.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.33.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.33.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.34.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.34.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.35.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.35.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.36.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.36.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.37.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.37.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.38.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.38.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.39.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.39.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.4.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.4.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.40.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.40.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.41.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.41.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.42.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.42.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.43.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.43.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.44.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.44.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.45.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.45.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.46.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.46.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.47.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.47.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.48.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.48.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.49.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.49.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.5.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.5.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.50.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.50.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.51.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.51.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.52.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.52.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.53.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.53.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.54.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.54.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.55.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.55.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.56.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.56.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.57.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.57.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.58.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.58.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.59.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.59.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.6.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.6.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.60.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.60.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.61.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.61.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.62.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.62.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.63.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.63.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.64.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.64.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.65.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.65.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.66.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.66.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.67.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.67.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.68.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.68.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.69.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.69.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.7.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.7.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.70.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.70.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.71.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.71.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.72.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.72.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.73.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.73.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.74.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.74.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.75.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.75.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.76.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.76.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.77.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.77.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.78.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.78.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.79.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.79.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.8.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.8.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.80.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.80.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.81.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.81.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.82.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.82.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.83.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.83.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.84.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.84.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.85.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.85.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.86.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.86.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.87.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.87.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.88.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.88.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.89.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.89.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.9.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.9.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.90.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.90.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.91.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.91.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.92.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.92.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.93.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.93.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.94.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.94.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.95.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.95.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.96.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.96.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.97.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.97.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.98.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.98.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.99.down_proj.weight": "model-00025-of-00049.safetensors",
+ "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.experts.99.up_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.mlp.gate.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.self_attn.k_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.self_attn.o_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.self_attn.q_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.25.self_attn.v_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.input_layernorm.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.0.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.0.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.1.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.1.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.10.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.10.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.100.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.100.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.101.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.101.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.102.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.102.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.103.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.103.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.104.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.104.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.105.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.105.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.106.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.106.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.107.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.107.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.108.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.108.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.109.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.109.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.11.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.11.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.110.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.110.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.111.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.111.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.112.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.112.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.113.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.113.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.114.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.114.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.115.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.115.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.116.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.116.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.117.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.117.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.118.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.118.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.119.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.119.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.12.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.12.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.120.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.120.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.121.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.121.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.122.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.122.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.123.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.123.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.124.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.124.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.125.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.125.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.126.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.126.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.127.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.127.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.13.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.13.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.14.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.14.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.15.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.15.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.16.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.16.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.17.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.17.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.18.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.18.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.19.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.19.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.2.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.2.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.20.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.20.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.21.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.21.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.22.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.22.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.23.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.23.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.24.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.24.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.25.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.25.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.26.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.26.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.27.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.27.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.28.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.28.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.29.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.29.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.3.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.3.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.30.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.30.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.31.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.31.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.32.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.32.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.33.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.33.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.34.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.34.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.35.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.35.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.36.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.36.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.37.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.37.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.38.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.38.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.39.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.39.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.4.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.4.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.40.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.40.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.41.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.41.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.42.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.42.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.43.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.43.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.44.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.44.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.45.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.45.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.46.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.46.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.47.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.47.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.48.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.48.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.49.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.49.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.5.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.5.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.50.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.50.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.51.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.51.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.52.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.52.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.53.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.53.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.54.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.54.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.55.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.55.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.56.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.56.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.57.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.57.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.58.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.58.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.59.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.59.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.6.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.6.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.60.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.60.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.61.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.61.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.62.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.62.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.63.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.63.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.64.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.64.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.65.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.65.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.66.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.66.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.67.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.67.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.68.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.68.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.69.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.69.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.7.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.7.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.70.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.70.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.71.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.71.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.72.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.72.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.73.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.73.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.74.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.74.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.75.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.75.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.76.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.76.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.77.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.77.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.78.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.78.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.79.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.79.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.8.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.8.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.80.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.80.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.81.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.81.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.82.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.82.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.83.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.83.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.84.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.84.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.85.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.85.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.86.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.86.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.87.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.87.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.88.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.88.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.89.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.89.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.9.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.9.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.90.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.90.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.91.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.91.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.92.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.92.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.93.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.93.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.94.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.94.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.95.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.95.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.96.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.96.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.97.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.97.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.98.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.98.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.99.down_proj.weight": "model-00026-of-00049.safetensors",
+ "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.experts.99.up_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.mlp.gate.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.self_attn.k_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.self_attn.o_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.self_attn.q_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.26.self_attn.v_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.input_layernorm.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.0.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.0.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.1.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.1.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.10.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.10.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.100.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.100.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.101.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.101.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.102.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.102.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.103.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.103.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.104.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.104.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.105.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.105.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.106.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.106.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.107.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.107.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.108.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.108.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.109.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.109.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.11.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.11.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.110.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.110.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.111.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.111.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.112.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.112.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.113.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.113.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.114.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.114.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.115.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.115.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.116.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.116.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.117.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.117.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.118.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.118.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.119.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.119.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.12.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.12.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.120.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.120.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.121.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.121.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.122.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.122.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.123.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.123.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.124.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.124.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.125.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.125.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.126.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.126.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.127.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.127.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.13.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.13.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.14.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.14.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.15.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.15.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.16.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.16.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.17.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.17.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.18.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.18.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.19.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.19.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.2.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.2.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.20.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.20.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.21.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.21.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.22.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.22.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.23.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.23.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.24.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.24.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.25.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.25.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.26.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.26.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.27.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.27.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.28.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.28.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.29.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.29.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.3.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.3.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.30.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.30.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.31.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.31.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.32.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.32.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.33.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.33.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.34.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.34.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.35.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.35.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.36.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.36.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.37.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.37.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.38.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.38.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.39.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.39.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.4.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.4.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.40.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.40.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.41.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.41.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.42.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.42.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.43.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.43.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.44.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.44.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.45.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.45.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.46.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.46.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.47.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.47.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.48.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.48.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.49.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.49.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.5.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.5.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.50.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.50.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.51.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.51.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.52.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.52.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.53.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.53.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.54.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.54.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.55.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.55.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.56.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.56.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.57.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.57.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.58.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.58.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.59.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.59.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.6.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.6.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.60.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.60.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.61.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.61.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.62.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.62.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.63.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.63.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.64.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.64.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.65.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.65.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.66.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.66.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.67.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.67.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.68.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.68.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.69.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.69.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.7.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.7.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.70.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.70.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.71.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.71.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.72.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.72.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.73.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.73.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.74.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.74.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.75.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.75.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.76.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.76.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.77.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.77.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.78.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.78.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.79.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.79.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.8.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.8.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.80.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.80.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.81.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.81.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.82.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.82.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.83.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.83.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.84.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.84.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.85.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.85.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.86.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.86.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.87.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.87.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.88.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.88.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.89.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.89.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.9.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.9.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.90.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.90.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.91.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.91.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.92.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.92.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.93.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.93.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.94.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.94.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.95.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.95.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.96.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.96.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.97.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.97.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.98.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.98.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.99.down_proj.weight": "model-00027-of-00049.safetensors",
+ "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.experts.99.up_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.mlp.gate.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.self_attn.k_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.self_attn.o_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.self_attn.q_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.27.self_attn.v_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.input_layernorm.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.0.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.0.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.1.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.1.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.10.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.10.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.100.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.100.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.101.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.101.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.102.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.102.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.103.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.103.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.104.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.104.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.105.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.105.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.106.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.106.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.107.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.107.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.108.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.108.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.109.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.109.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.11.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.11.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.110.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.110.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.111.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.111.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.112.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.112.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.113.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.113.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.114.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.114.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.115.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.115.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.116.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.116.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.117.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.117.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.118.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.118.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.119.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.119.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.12.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.12.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.120.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.120.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.121.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.121.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.122.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.122.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.123.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.123.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.124.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.124.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.125.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.125.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.126.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.126.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.127.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.127.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.13.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.13.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.14.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.14.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.15.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.15.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.16.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.16.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.17.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.17.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.18.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.18.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.19.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.19.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.2.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.2.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.20.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.20.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.21.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.21.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.22.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.22.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.23.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.23.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.24.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.24.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.25.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.25.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.26.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.26.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.27.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.27.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.28.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.28.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.29.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.29.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.3.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.3.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.30.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.30.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.31.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.31.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.32.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.32.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.33.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.33.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.34.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.34.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.35.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.35.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.36.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.36.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.37.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.37.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.38.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.38.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.39.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.39.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.4.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.4.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.40.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.40.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.41.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.41.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.42.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.42.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.43.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.43.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.44.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.44.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.45.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.45.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.46.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.46.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.47.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.47.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.48.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.48.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.49.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.49.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.5.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.5.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.50.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.50.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.51.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.51.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.52.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.52.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.53.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.53.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.54.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.54.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.55.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.55.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.56.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.56.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.57.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.57.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.58.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.58.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.59.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.59.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.6.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.6.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.60.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.60.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.61.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.61.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.62.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.62.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.63.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.63.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.64.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.64.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.65.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.65.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.66.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.66.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.67.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.67.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.68.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.68.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.69.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.69.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.7.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.7.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.70.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.70.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.71.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.71.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.72.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.72.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.73.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.73.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.74.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.74.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.75.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.75.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.76.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.76.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.77.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.77.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.78.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.78.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.79.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.79.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.8.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.8.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.80.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.80.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.81.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.81.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.82.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.82.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.83.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.83.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.84.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.84.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.85.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.85.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.86.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.86.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.87.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.87.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.88.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.88.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.89.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.89.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.9.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.9.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.90.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.90.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.91.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.91.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.92.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.92.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.93.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.93.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.94.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.94.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.95.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.95.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.96.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.96.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.97.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.97.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.98.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.98.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.99.down_proj.weight": "model-00028-of-00049.safetensors",
+ "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.experts.99.up_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.mlp.gate.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.self_attn.k_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.self_attn.o_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.self_attn.q_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.28.self_attn.v_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.input_layernorm.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.0.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.0.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.1.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.1.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.10.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.10.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.100.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.100.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.101.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.101.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.102.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.102.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.103.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.103.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.104.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.104.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.105.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.105.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.106.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.106.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.107.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.107.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.108.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.108.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.109.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.109.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.11.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.11.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.110.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.110.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.111.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.111.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.112.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.112.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.113.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.113.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.114.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.114.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.115.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.115.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.116.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.116.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.117.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.117.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.118.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.118.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.119.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.119.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.12.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.12.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.120.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.120.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.121.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.121.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.122.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.122.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.123.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.123.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.124.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.124.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.125.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.125.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.126.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.126.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.127.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.127.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.13.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.13.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.14.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.14.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.15.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.15.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.16.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.16.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.17.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.17.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.18.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.18.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.19.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.19.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.2.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.2.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.20.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.20.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.21.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.21.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.22.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.22.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.23.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.23.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.24.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.24.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.25.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.25.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.26.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.26.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.27.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.27.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.28.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.28.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.29.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.29.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.3.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.3.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.30.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.30.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.31.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.31.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.32.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.32.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.33.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.33.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.34.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.34.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.35.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.35.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.36.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.36.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.37.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.37.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.38.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.38.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.39.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.39.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.4.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.4.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.40.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.40.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.41.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.41.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.42.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.42.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.43.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.43.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.44.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.44.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.45.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.45.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.46.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.46.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.47.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.47.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.48.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.48.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.49.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.49.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.5.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.5.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.50.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.50.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.51.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.51.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.52.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.52.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.53.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.53.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.54.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.54.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.55.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.55.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.56.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.56.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.57.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.57.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.58.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.58.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.59.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.59.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.6.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.6.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.60.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.60.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.61.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.61.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.62.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.62.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.63.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.63.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.64.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.64.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.65.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.65.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.66.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.66.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.67.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.67.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.68.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.68.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.69.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.69.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.7.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.7.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.70.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.70.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.71.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.71.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.72.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.72.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.73.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.73.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.74.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.74.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.75.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.75.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.76.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.76.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.77.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.77.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.78.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.78.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.79.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.79.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.8.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.8.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.80.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.80.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.81.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.81.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.82.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.82.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.83.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.83.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.84.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.84.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.85.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.85.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.86.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.86.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.87.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.87.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.88.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.88.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.89.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.89.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.9.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.9.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.90.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.90.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.91.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.91.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.92.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.92.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.93.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.93.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.94.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.94.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.95.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.95.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.96.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.96.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.97.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.97.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.98.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.98.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.99.down_proj.weight": "model-00029-of-00049.safetensors",
+ "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.experts.99.up_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.mlp.gate.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.self_attn.k_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.self_attn.o_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.self_attn.q_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.29.self_attn.v_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.3.input_layernorm.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.0.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.0.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.1.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.1.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.10.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.10.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.100.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.100.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.101.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.101.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.102.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.102.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.103.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.104.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.105.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.106.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.107.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.108.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.109.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.11.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.11.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.110.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.111.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.112.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.113.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.114.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.115.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.116.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.117.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.118.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.119.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.12.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.12.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.120.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.121.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.122.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.123.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.124.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.125.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.125.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.126.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.127.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.13.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.13.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.14.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.14.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.15.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.15.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.16.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.16.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.17.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.17.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.18.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.18.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.19.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.19.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.2.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.2.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.20.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.20.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.21.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.21.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.22.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.22.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.23.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.23.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.24.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.24.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.25.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.25.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.26.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.26.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.27.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.27.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.28.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.28.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.29.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.29.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.3.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.3.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.30.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.30.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.31.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.31.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.32.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.32.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.33.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.33.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.34.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.34.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.35.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.35.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.36.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.36.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.37.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.37.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.38.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.38.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.39.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.39.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.4.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.4.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.40.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.40.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.41.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.41.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.42.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.42.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.43.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.43.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.44.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.44.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.45.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.45.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.46.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.46.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.47.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.47.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.48.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.48.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.49.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.49.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.5.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.5.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.50.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.50.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.51.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.51.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.52.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.52.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.53.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.53.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.54.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.54.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.55.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.55.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.56.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.56.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.57.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.57.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.58.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.58.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.59.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.59.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.6.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.6.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.60.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.60.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.61.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.61.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.62.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.62.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.63.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.63.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.64.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.64.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.65.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.65.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.66.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.66.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.67.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.67.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.68.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.68.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.69.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.69.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.7.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.7.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.70.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.70.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.71.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.71.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.72.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.72.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.73.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.73.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.74.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.74.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.75.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.75.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.76.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.76.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.77.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.77.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.78.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.78.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.79.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.79.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.8.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.8.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.80.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.80.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.81.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.81.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.82.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.82.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.83.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.83.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.84.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.84.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.85.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.85.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.86.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.86.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.87.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.87.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.88.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.88.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.89.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.89.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.9.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.9.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.90.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.90.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.91.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.91.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.92.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.92.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.93.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.93.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.94.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.94.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.95.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.95.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.96.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.96.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.97.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.97.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.98.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.98.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.99.down_proj.weight": "model-00003-of-00049.safetensors",
+ "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.experts.99.up_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.mlp.gate.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.self_attn.o_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.self_attn.q_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.3.self_attn.v_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.30.input_layernorm.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.0.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.0.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.1.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.1.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.10.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.10.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.100.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.100.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.101.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.101.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.102.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.102.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.103.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.103.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.104.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.104.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.105.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.105.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.106.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.106.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.107.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.107.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.108.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.108.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.109.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.109.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.11.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.11.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.110.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.110.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.111.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.111.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.112.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.112.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.113.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.113.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.114.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.114.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.115.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.115.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.116.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.116.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.117.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.117.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.118.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.118.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.119.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.119.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.12.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.12.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.120.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.120.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.121.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.121.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.122.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.122.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.123.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.123.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.124.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.124.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.125.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.125.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.126.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.126.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.127.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.127.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.13.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.13.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.14.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.14.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.15.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.15.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.16.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.16.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.17.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.17.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.18.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.18.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.19.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.19.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.2.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.2.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.20.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.20.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.21.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.21.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.22.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.22.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.23.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.23.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.24.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.24.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.25.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.25.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.26.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.26.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.27.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.27.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.28.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.28.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.29.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.29.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.3.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.3.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.30.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.30.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.31.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.31.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.32.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.32.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.33.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.33.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.34.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.34.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.35.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.35.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.36.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.36.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.37.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.37.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.38.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.38.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.39.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.39.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.4.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.4.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.40.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.40.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.41.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.41.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.42.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.42.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.43.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.43.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.44.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.44.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.45.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.45.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.46.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.46.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.47.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.47.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.48.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.48.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.49.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.49.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.5.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.5.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.50.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.50.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.51.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.51.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.52.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.52.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.53.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.53.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.54.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.54.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.55.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.55.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.56.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.56.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.57.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.57.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.58.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.58.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.59.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.59.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.6.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.6.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.60.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.60.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.61.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.61.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.62.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.62.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.63.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.63.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.64.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.64.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.65.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.65.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.66.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.66.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.67.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.67.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.68.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.68.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.69.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.69.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.7.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.7.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.70.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.70.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.71.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.71.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.72.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.72.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.73.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.73.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.74.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.74.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.75.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.75.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.76.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.76.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.77.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.77.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.78.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.78.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.79.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.79.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.8.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.8.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.80.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.80.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.81.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.81.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.82.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.82.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.83.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.83.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.84.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.84.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.85.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.85.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.86.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.86.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.87.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.87.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.88.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.88.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.89.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.89.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.9.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.9.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.90.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.90.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.91.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.91.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.92.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.92.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.93.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.93.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.94.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.94.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.95.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.95.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.96.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.96.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.97.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.97.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.98.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.98.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.99.down_proj.weight": "model-00030-of-00049.safetensors",
+ "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.experts.99.up_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.mlp.gate.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.self_attn.k_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.self_attn.o_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.self_attn.q_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.30.self_attn.v_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.input_layernorm.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.0.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.0.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.1.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.1.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.10.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.10.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.100.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.100.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.101.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.101.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.102.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.102.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.103.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.103.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.104.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.104.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.105.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.105.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.106.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.106.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.107.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.107.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.108.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.108.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.109.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.109.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.11.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.11.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.110.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.110.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.111.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.111.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.112.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.112.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.113.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.113.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.114.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.114.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.115.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.115.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.116.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.116.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.117.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.117.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.118.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.118.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.119.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.119.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.12.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.12.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.120.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.120.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.121.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.121.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.122.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.122.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.123.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.123.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.124.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.124.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.125.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.125.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.126.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.126.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.127.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.127.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.13.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.13.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.14.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.14.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.15.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.15.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.16.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.16.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.17.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.17.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.18.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.18.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.19.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.19.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.2.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.2.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.20.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.20.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.21.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.21.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.22.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.22.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.23.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.23.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.24.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.24.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.25.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.25.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.26.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.26.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.27.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.27.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.28.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.28.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.29.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.29.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.3.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.3.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.30.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.30.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.31.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.31.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.32.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.32.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.33.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.33.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.34.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.34.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.35.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.35.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.36.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.36.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.37.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.37.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.38.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.38.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.39.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.39.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.4.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.4.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.40.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.40.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.41.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.41.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.42.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.42.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.43.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.43.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.44.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.44.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.45.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.45.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.46.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.46.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.47.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.47.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.48.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.48.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.49.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.49.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.5.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.5.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.50.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.50.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.51.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.51.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.52.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.52.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.53.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.53.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.54.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.54.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.55.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.55.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.56.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.56.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.57.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.57.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.58.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.58.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.59.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.59.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.6.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.6.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.60.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.60.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.61.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.61.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.62.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.62.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.63.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.63.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.64.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.64.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.65.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.65.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.66.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.66.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.67.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.67.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.68.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.68.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.69.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.69.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.7.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.7.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.70.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.70.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.71.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.71.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.72.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.72.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.73.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.73.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.74.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.74.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.75.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.75.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.76.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.76.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.77.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.77.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.78.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.78.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.79.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.79.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.8.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.8.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.80.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.80.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.81.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.81.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.82.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.82.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.83.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.83.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.84.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.84.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.85.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.85.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.86.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.86.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.87.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.87.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.88.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.88.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.89.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.89.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.9.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.9.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.90.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.90.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.91.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.91.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.92.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.92.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.93.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.93.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.94.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.94.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.95.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.95.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.96.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.96.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.97.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.97.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.98.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.98.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.99.down_proj.weight": "model-00031-of-00049.safetensors",
+ "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.experts.99.up_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.mlp.gate.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.self_attn.k_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.self_attn.o_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.self_attn.q_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.31.self_attn.v_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.input_layernorm.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.0.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.0.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.1.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.1.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.10.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.10.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.100.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.100.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.101.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.101.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.102.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.102.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.103.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.103.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.104.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.104.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.105.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.105.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.106.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.106.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.107.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.107.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.108.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.108.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.109.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.109.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.11.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.11.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.110.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.110.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.111.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.111.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.112.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.112.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.113.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.113.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.114.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.114.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.115.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.115.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.116.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.116.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.117.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.117.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.118.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.118.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.119.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.119.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.12.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.12.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.120.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.120.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.121.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.121.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.122.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.122.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.123.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.123.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.124.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.124.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.125.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.125.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.126.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.126.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.127.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.127.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.13.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.13.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.14.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.14.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.15.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.15.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.16.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.16.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.17.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.17.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.18.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.18.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.19.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.19.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.2.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.2.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.20.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.20.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.21.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.21.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.22.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.22.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.23.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.23.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.24.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.24.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.25.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.25.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.26.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.26.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.27.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.27.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.28.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.28.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.29.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.29.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.3.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.3.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.30.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.30.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.31.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.31.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.32.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.32.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.33.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.33.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.34.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.34.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.35.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.35.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.36.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.36.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.37.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.37.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.38.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.38.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.39.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.39.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.4.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.4.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.40.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.40.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.41.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.41.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.42.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.42.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.43.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.43.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.44.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.44.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.45.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.45.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.46.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.46.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.47.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.47.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.48.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.48.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.49.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.49.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.5.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.5.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.50.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.50.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.51.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.51.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.52.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.52.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.53.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.53.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.54.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.54.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.55.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.55.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.56.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.56.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.57.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.57.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.58.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.58.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.59.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.59.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.6.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.6.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.60.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.60.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.61.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.61.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.62.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.62.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.63.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.63.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.64.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.64.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.65.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.65.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.66.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.66.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.67.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.67.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.68.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.68.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.69.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.69.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.7.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.7.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.70.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.70.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.71.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.71.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.72.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.72.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.73.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.73.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.74.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.74.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.75.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.75.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.76.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.76.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.77.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.77.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.78.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.78.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.79.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.79.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.8.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.8.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.80.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.80.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.81.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.81.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.82.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.82.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.83.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.83.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.84.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.84.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.85.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.85.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.86.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.86.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.87.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.87.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.88.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.88.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.89.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.89.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.9.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.9.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.90.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.90.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.91.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.91.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.92.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.92.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.93.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.93.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.94.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.94.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.95.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.95.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.96.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.96.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.97.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.97.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.98.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.98.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.99.down_proj.weight": "model-00032-of-00049.safetensors",
+ "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.experts.99.up_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.mlp.gate.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.self_attn.k_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.self_attn.o_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.self_attn.q_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.32.self_attn.v_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.input_layernorm.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.0.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.0.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.1.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.1.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.10.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.10.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.100.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.100.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.101.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.101.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.102.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.102.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.103.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.103.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.104.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.104.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.105.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.105.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.106.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.106.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.107.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.107.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.108.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.108.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.109.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.109.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.11.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.11.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.110.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.110.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.111.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.111.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.112.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.112.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.113.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.113.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.114.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.114.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.115.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.115.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.116.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.116.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.117.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.117.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.118.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.118.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.119.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.119.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.12.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.12.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.120.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.120.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.121.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.121.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.122.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.122.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.123.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.123.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.124.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.124.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.125.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.125.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.126.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.126.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.127.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.127.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.13.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.13.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.14.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.14.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.15.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.15.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.16.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.16.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.17.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.17.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.18.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.18.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.19.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.19.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.2.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.2.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.20.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.20.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.21.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.21.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.22.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.22.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.23.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.23.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.24.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.24.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.25.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.25.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.26.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.26.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.27.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.27.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.28.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.28.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.29.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.29.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.3.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.3.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.30.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.30.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.31.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.31.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.32.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.32.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.33.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.33.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.34.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.34.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.35.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.35.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.36.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.36.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.37.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.37.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.38.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.38.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.39.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.39.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.4.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.4.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.40.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.40.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.41.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.41.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.42.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.42.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.43.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.43.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.44.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.44.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.45.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.45.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.46.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.46.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.47.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.47.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.48.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.48.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.49.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.49.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.5.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.5.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.50.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.50.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.51.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.51.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.52.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.52.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.53.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.53.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.54.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.54.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.55.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.55.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.56.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.56.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.57.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.57.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.58.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.58.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.59.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.59.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.6.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.6.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.60.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.60.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.61.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.61.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.62.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.62.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.63.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.63.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.64.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.64.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.65.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.65.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.66.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.66.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.67.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.67.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.68.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.68.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.69.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.69.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.7.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.7.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.70.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.70.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.71.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.71.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.72.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.72.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.73.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.73.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.74.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.74.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.75.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.75.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.76.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.76.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.77.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.77.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.78.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.78.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.79.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.79.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.8.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.8.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.80.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.80.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.81.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.81.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.82.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.82.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.83.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.83.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.84.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.84.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.85.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.85.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.86.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.86.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.87.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.87.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.88.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.88.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.89.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.89.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.9.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.9.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.90.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.90.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.91.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.91.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.92.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.92.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.93.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.93.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.94.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.94.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.95.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.95.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.96.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.96.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.97.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.97.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.98.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.98.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.99.down_proj.weight": "model-00033-of-00049.safetensors",
+ "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.experts.99.up_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.mlp.gate.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.self_attn.k_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.self_attn.o_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.self_attn.q_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.33.self_attn.v_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.input_layernorm.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.0.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.0.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.1.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.1.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.10.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.10.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.100.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.100.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.101.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.101.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.102.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.102.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.103.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.103.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.104.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.104.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.105.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.105.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.106.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.106.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.107.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.107.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.108.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.108.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.109.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.109.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.11.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.11.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.110.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.110.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.111.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.111.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.112.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.112.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.113.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.113.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.114.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.114.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.115.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.115.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.116.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.116.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.117.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.117.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.118.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.118.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.119.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.119.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.12.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.12.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.120.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.120.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.121.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.121.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.122.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.122.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.123.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.123.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.124.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.124.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.125.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.125.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.126.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.126.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.127.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.127.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.13.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.13.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.14.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.14.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.15.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.15.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.16.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.16.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.17.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.17.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.18.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.18.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.19.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.19.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.2.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.2.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.20.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.20.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.21.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.21.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.22.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.22.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.23.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.23.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.24.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.24.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.25.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.25.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.26.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.26.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.27.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.27.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.28.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.28.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.29.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.29.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.3.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.3.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.30.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.30.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.31.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.31.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.32.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.32.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.33.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.33.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.34.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.34.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.35.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.35.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.36.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.36.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.37.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.37.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.38.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.38.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.39.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.39.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.4.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.4.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.40.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.40.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.41.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.41.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.42.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.42.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.43.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.43.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.44.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.44.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.45.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.45.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.46.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.46.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.47.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.47.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.48.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.48.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.49.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.49.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.5.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.5.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.50.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.50.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.51.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.51.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.52.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.52.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.53.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.53.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.54.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.54.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.55.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.55.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.56.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.56.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.57.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.57.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.58.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.58.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.59.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.59.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.6.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.6.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.60.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.60.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.61.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.61.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.62.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.62.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.63.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.63.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.64.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.64.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.65.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.65.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.66.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.66.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.67.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.67.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.68.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.68.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.69.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.69.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.7.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.7.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.70.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.70.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.71.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.71.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.72.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.72.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.73.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.73.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.74.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.74.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.75.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.75.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.76.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.76.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.77.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.77.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.78.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.78.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.79.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.79.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.8.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.8.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.80.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.80.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.81.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.81.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.82.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.82.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.83.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.83.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.84.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.84.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.85.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.85.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.86.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.86.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.87.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.87.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.88.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.88.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.89.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.89.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.9.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.9.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.90.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.90.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.91.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.91.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.92.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.92.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.93.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.93.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.94.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.94.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.95.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.95.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.96.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.96.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.97.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.97.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.98.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.98.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.99.down_proj.weight": "model-00034-of-00049.safetensors",
+ "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.experts.99.up_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.mlp.gate.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.self_attn.k_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.self_attn.o_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.self_attn.q_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.34.self_attn.v_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.input_layernorm.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.0.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.0.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.1.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.1.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.10.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.10.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.100.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.100.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.101.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.101.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.102.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.102.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.103.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.103.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.104.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.104.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.105.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.105.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.106.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.106.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.107.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.107.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.108.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.108.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.109.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.109.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.11.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.11.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.110.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.110.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.111.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.111.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.112.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.112.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.113.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.113.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.114.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.114.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.115.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.115.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.116.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.116.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.117.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.117.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.118.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.118.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.119.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.119.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.12.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.12.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.120.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.120.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.121.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.121.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.122.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.122.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.123.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.123.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.124.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.124.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.125.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.125.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.126.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.126.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.127.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.127.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.13.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.13.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.14.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.14.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.15.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.15.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.16.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.16.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.17.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.17.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.18.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.18.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.19.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.19.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.2.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.2.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.20.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.20.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.21.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.21.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.22.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.22.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.23.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.23.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.24.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.24.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.25.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.25.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.26.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.26.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.27.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.27.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.28.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.28.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.29.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.29.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.3.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.3.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.30.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.30.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.31.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.31.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.32.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.32.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.33.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.33.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.34.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.34.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.35.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.35.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.36.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.36.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.37.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.37.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.38.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.38.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.39.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.39.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.4.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.4.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.40.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.40.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.41.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.41.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.42.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.42.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.43.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.43.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.44.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.44.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.45.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.45.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.46.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.46.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.47.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.47.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.48.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.48.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.49.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.49.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.5.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.5.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.50.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.50.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.51.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.51.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.52.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.52.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.53.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.53.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.54.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.54.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.55.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.55.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.56.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.56.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.57.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.57.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.58.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.58.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.59.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.59.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.6.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.6.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.60.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.60.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.61.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.61.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.62.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.62.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.63.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.63.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.64.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.64.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.65.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.65.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.66.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.66.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.67.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.67.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.68.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.68.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.69.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.69.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.7.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.7.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.70.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.70.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.71.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.71.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.72.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.72.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.73.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.73.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.74.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.74.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.75.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.75.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.76.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.76.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.77.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.77.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.78.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.78.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.79.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.79.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.8.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.8.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.80.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.80.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.81.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.81.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.82.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.82.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.83.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.83.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.84.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.84.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.85.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.85.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.86.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.86.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.87.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.87.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.88.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.88.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.89.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.89.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.9.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.9.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.90.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.90.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.91.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.91.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.92.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.92.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.93.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.93.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.94.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.94.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.95.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.95.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.96.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.96.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.97.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.97.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.98.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.98.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.99.down_proj.weight": "model-00035-of-00049.safetensors",
+ "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.experts.99.up_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.mlp.gate.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.self_attn.k_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.self_attn.o_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.self_attn.q_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.35.self_attn.v_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.input_layernorm.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.0.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.0.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.1.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.1.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.10.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.10.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.100.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.100.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.101.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.101.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.102.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.102.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.103.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.103.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.104.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.104.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.105.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.105.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.106.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.106.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.107.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.107.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.108.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.108.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.109.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.109.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.11.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.11.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.110.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.110.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.111.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.111.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.112.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.112.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.113.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.113.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.114.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.114.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.115.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.115.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.116.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.116.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.117.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.117.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.118.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.118.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.119.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.119.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.12.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.12.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.120.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.120.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.121.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.121.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.122.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.122.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.123.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.123.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.124.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.124.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.125.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.125.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.126.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.126.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.127.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.127.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.13.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.13.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.14.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.14.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.15.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.15.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.16.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.16.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.17.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.17.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.18.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.18.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.19.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.19.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.2.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.2.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.20.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.20.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.21.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.21.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.22.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.22.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.23.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.23.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.24.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.24.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.25.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.25.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.26.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.26.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.27.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.27.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.28.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.28.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.29.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.29.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.3.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.3.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.30.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.30.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.31.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.31.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.32.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.32.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.33.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.33.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.34.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.34.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.35.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.35.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.36.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.36.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.37.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.37.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.38.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.38.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.39.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.39.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.4.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.4.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.40.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.40.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.41.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.41.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.42.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.42.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.43.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.43.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.44.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.44.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.45.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.45.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.46.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.46.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.47.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.47.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.48.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.48.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.49.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.49.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.5.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.5.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.50.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.50.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.51.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.51.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.52.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.52.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.53.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.53.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.54.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.54.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.55.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.55.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.56.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.56.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.57.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.57.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.58.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.58.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.59.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.59.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.6.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.6.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.60.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.60.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.61.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.61.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.62.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.62.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.63.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.63.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.64.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.64.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.65.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.65.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.66.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.66.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.67.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.67.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.68.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.68.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.69.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.69.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.7.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.7.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.70.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.70.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.71.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.71.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.72.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.72.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.73.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.73.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.74.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.74.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.75.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.75.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.76.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.76.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.77.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.77.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.78.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.78.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.79.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.79.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.8.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.8.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.80.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.80.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.81.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.81.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.82.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.82.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.83.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.83.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.84.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.84.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.85.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.85.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.86.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.86.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.87.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.87.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.88.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.88.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.89.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.89.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.9.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.9.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.90.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.90.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.91.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.91.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.92.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.92.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.93.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.93.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.94.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.94.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.95.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.95.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.96.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.96.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.97.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.97.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.98.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.98.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.99.down_proj.weight": "model-00036-of-00049.safetensors",
+ "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.experts.99.up_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.mlp.gate.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.self_attn.k_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.self_attn.o_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.self_attn.q_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.36.self_attn.v_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.input_layernorm.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.0.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.0.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.1.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.1.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.10.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.10.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.100.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.100.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.101.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.101.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.102.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.102.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.103.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.103.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.104.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.104.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.105.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.105.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.106.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.106.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.107.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.107.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.108.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.108.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.109.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.109.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.11.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.11.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.110.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.110.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.111.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.111.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.112.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.112.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.113.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.113.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.114.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.114.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.115.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.115.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.116.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.116.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.117.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.117.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.118.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.118.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.119.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.119.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.12.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.12.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.120.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.120.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.121.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.121.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.122.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.122.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.123.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.123.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.124.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.124.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.125.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.125.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.126.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.126.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.127.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.127.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.13.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.13.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.14.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.14.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.15.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.15.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.16.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.16.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.17.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.17.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.18.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.18.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.19.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.19.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.2.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.2.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.20.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.20.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.21.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.21.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.22.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.22.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.23.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.23.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.24.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.24.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.25.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.25.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.26.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.26.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.27.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.27.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.28.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.28.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.29.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.29.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.3.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.3.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.30.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.30.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.31.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.31.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.32.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.32.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.33.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.33.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.34.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.34.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.35.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.35.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.36.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.36.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.37.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.37.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.38.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.38.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.39.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.39.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.4.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.4.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.40.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.40.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.41.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.41.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.42.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.42.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.43.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.43.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.44.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.44.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.45.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.45.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.46.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.46.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.47.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.47.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.48.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.48.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.49.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.49.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.5.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.5.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.50.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.50.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.51.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.51.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.52.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.52.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.53.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.53.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.54.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.54.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.55.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.55.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.56.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.56.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.57.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.57.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.58.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.58.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.59.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.59.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.6.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.6.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.60.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.60.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.61.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.61.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.62.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.62.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.63.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.63.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.64.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.64.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.65.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.65.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.66.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.66.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.67.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.67.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.68.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.68.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.69.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.69.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.7.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.7.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.70.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.70.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.71.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.71.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.72.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.72.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.73.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.73.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.74.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.74.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.75.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.75.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.76.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.76.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.77.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.77.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.78.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.78.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.79.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.79.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.8.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.8.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.80.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.80.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.81.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.81.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.82.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.82.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.83.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.83.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.84.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.84.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.85.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.85.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.86.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.86.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.87.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.87.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.88.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.88.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.89.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.89.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.9.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.9.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.90.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.90.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.91.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.91.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.92.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.92.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.93.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.93.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.94.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.94.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.95.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.95.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.96.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.96.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.97.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.97.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.98.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.98.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.99.down_proj.weight": "model-00037-of-00049.safetensors",
+ "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.experts.99.up_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.mlp.gate.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.self_attn.k_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.self_attn.o_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.self_attn.q_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.37.self_attn.v_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.input_layernorm.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.0.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.0.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.1.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.1.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.10.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.10.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.100.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.100.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.101.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.101.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.102.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.102.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.103.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.103.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.104.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.104.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.105.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.105.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.106.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.106.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.107.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.107.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.108.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.108.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.109.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.109.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.11.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.11.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.110.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.110.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.111.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.111.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.112.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.112.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.113.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.113.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.114.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.114.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.115.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.115.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.116.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.116.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.117.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.117.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.118.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.118.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.119.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.119.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.12.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.12.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.120.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.120.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.121.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.121.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.122.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.122.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.123.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.123.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.124.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.124.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.125.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.125.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.126.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.126.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.127.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.127.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.13.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.13.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.14.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.14.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.15.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.15.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.16.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.16.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.17.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.17.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.18.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.18.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.19.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.19.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.2.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.2.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.20.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.20.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.21.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.21.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.22.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.22.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.23.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.23.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.24.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.24.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.25.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.25.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.26.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.26.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.27.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.27.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.28.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.28.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.29.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.29.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.3.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.3.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.30.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.30.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.31.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.31.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.32.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.32.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.33.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.33.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.34.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.34.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.35.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.35.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.36.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.36.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.37.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.37.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.38.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.38.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.39.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.39.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.4.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.4.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.40.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.40.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.41.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.41.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.42.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.42.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.43.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.43.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.44.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.44.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.45.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.45.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.46.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.46.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.47.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.47.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.48.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.48.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.49.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.49.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.5.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.5.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.50.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.50.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.51.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.51.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.52.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.52.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.53.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.53.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.54.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.54.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.55.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.55.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.56.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.56.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.57.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.57.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.58.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.58.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.59.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.59.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.6.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.6.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.60.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.60.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.61.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.61.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.62.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.62.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.63.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.63.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.64.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.64.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.65.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.65.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.66.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.66.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.67.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.67.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.68.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.68.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.69.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.69.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.7.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.7.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.70.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.70.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.71.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.71.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.72.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.72.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.73.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.73.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.74.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.74.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.75.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.75.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.76.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.76.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.77.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.77.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.78.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.78.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.79.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.79.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.8.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.8.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.80.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.80.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.81.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.81.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.82.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.82.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.83.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.83.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.84.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.84.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.85.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.85.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.86.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.86.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.87.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.87.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.88.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.88.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.89.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.89.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.9.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.9.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.90.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.90.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.91.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.91.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.92.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.92.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.93.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.93.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.94.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.94.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.95.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.95.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.96.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.96.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.97.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.97.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.98.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.98.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.99.down_proj.weight": "model-00038-of-00049.safetensors",
+ "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.experts.99.up_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.mlp.gate.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.self_attn.k_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.self_attn.o_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.self_attn.q_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.38.self_attn.v_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.input_layernorm.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.0.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.0.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.1.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.1.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.10.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.10.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.100.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.100.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.101.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.101.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.102.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.102.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.103.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.103.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.104.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.104.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.105.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.105.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.106.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.106.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.107.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.107.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.108.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.108.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.109.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.109.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.11.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.11.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.110.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.110.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.111.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.111.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.112.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.112.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.113.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.113.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.114.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.114.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.115.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.115.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.116.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.116.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.117.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.117.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.118.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.118.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.119.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.119.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.12.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.12.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.120.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.120.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.121.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.121.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.122.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.122.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.123.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.123.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.124.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.124.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.125.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.125.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.126.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.126.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.127.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.127.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.13.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.13.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.14.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.14.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.15.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.15.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.16.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.16.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.17.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.17.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.18.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.18.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.19.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.19.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.2.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.2.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.20.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.20.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.21.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.21.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.22.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.22.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.23.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.23.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.24.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.24.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.25.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.25.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.26.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.26.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.27.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.27.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.28.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.28.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.29.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.29.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.3.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.3.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.30.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.30.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.31.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.31.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.32.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.32.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.33.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.33.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.34.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.34.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.35.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.35.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.36.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.36.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.37.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.37.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.38.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.38.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.39.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.39.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.4.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.4.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.40.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.40.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.41.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.41.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.42.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.42.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.43.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.43.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.44.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.44.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.45.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.45.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.46.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.46.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.47.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.47.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.48.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.48.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.49.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.49.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.5.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.5.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.50.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.50.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.51.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.51.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.52.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.52.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.53.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.53.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.54.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.54.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.55.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.55.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.56.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.56.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.57.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.57.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.58.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.58.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.59.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.59.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.6.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.6.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.60.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.60.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.61.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.61.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.62.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.62.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.63.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.63.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.64.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.64.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.65.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.65.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.66.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.66.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.67.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.67.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.68.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.68.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.69.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.69.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.7.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.7.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.70.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.70.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.71.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.71.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.72.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.72.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.73.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.73.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.74.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.74.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.75.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.75.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.76.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.76.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.77.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.77.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.78.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.78.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.79.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.79.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.8.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.8.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.80.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.80.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.81.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.81.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.82.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.82.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.83.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.83.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.84.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.84.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.85.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.85.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.86.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.86.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.87.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.87.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.88.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.88.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.89.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.89.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.9.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.9.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.90.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.90.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.91.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.91.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.92.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.92.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.93.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.93.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.94.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.94.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.95.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.95.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.96.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.96.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.97.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.97.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.98.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.98.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.99.down_proj.weight": "model-00039-of-00049.safetensors",
+ "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.experts.99.up_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.mlp.gate.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.self_attn.k_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.self_attn.o_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.self_attn.q_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.39.self_attn.v_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.4.input_layernorm.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.100.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.101.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.102.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.103.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.104.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.105.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.106.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.107.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.108.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.109.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.110.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.111.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.112.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.113.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.114.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.115.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.116.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.117.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.118.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.119.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.120.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.121.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.122.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.123.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.124.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.125.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.126.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.127.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.51.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.52.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.53.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.54.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.55.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.56.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.57.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.58.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.59.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.60.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.61.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.62.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.63.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.64.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.65.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.66.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.67.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.68.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.69.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.70.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.71.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.72.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.73.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.74.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.75.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.76.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.77.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.78.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.79.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.80.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.81.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.82.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.83.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.84.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.85.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.86.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.87.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.88.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.89.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.90.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.91.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.92.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.93.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.94.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.95.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.96.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.97.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.98.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.99.down_proj.weight": "model-00004-of-00049.safetensors",
+ "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.mlp.gate.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.self_attn.q_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.4.self_attn.v_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.40.input_layernorm.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.0.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.0.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.1.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.1.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.10.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.10.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.100.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.100.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.101.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.101.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.102.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.102.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.103.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.103.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.104.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.104.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.105.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.105.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.106.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.106.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.107.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.107.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.108.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.108.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.109.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.109.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.11.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.11.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.110.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.110.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.111.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.111.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.112.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.112.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.113.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.113.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.114.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.114.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.115.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.115.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.116.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.116.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.117.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.117.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.118.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.118.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.119.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.119.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.12.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.12.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.120.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.120.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.121.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.121.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.122.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.122.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.123.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.123.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.124.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.124.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.125.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.125.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.126.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.126.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.127.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.127.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.13.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.13.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.14.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.14.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.15.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.15.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.16.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.16.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.17.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.17.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.18.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.18.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.19.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.19.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.2.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.2.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.20.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.20.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.21.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.21.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.22.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.22.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.23.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.23.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.24.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.24.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.25.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.25.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.26.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.26.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.27.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.27.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.28.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.28.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.29.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.29.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.3.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.3.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.30.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.30.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.31.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.31.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.32.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.32.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.33.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.33.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.34.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.34.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.35.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.35.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.36.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.36.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.37.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.37.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.38.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.38.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.39.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.39.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.4.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.4.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.40.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.40.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.41.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.41.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.42.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.42.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.43.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.43.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.44.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.44.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.45.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.45.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.46.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.46.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.47.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.47.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.48.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.48.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.49.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.49.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.5.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.5.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.50.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.50.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.51.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.51.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.52.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.52.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.53.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.53.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.54.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.54.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.55.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.55.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.56.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.56.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.57.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.57.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.58.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.58.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.59.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.59.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.6.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.6.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.60.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.60.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.61.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.61.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.62.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.62.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.63.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.63.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.64.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.64.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.65.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.65.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.66.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.66.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.67.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.67.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.68.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.68.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.69.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.69.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.7.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.7.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.70.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.70.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.71.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.71.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.72.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.72.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.73.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.73.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.74.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.74.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.75.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.75.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.76.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.76.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.77.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.77.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.78.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.78.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.79.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.79.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.8.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.8.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.80.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.80.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.81.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.81.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.82.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.82.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.83.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.83.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.84.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.84.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.85.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.85.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.86.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.86.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.87.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.87.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.88.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.88.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.89.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.89.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.9.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.9.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.90.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.90.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.91.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.91.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.92.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.92.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.93.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.93.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.94.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.94.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.95.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.95.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.96.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.96.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.97.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.97.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.98.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.98.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.99.down_proj.weight": "model-00040-of-00049.safetensors",
+ "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.experts.99.up_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.mlp.gate.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.self_attn.k_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.self_attn.o_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.self_attn.q_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.40.self_attn.v_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.input_layernorm.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.0.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.0.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.1.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.1.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.10.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.10.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.100.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.100.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.101.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.101.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.102.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.102.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.103.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.103.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.104.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.104.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.105.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.105.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.106.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.106.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.107.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.107.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.108.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.108.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.109.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.109.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.11.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.11.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.110.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.110.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.111.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.111.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.112.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.112.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.113.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.113.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.114.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.114.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.115.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.115.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.116.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.116.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.117.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.117.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.118.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.118.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.119.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.119.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.12.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.12.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.120.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.120.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.121.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.121.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.122.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.122.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.123.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.123.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.124.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.124.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.125.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.125.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.126.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.126.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.127.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.127.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.13.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.13.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.14.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.14.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.15.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.15.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.16.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.16.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.17.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.17.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.18.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.18.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.19.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.19.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.2.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.2.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.20.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.20.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.21.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.21.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.22.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.22.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.23.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.23.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.24.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.24.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.25.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.25.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.26.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.26.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.27.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.27.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.28.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.28.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.29.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.29.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.3.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.3.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.30.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.30.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.31.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.31.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.32.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.32.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.33.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.33.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.34.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.34.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.35.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.35.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.36.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.36.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.37.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.37.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.38.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.38.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.39.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.39.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.4.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.4.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.40.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.40.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.41.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.41.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.42.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.42.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.43.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.43.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.44.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.44.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.45.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.45.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.46.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.46.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.47.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.47.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.48.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.48.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.49.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.49.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.5.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.5.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.50.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.50.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.51.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.51.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.52.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.52.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.53.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.53.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.54.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.54.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.55.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.55.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.56.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.56.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.57.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.57.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.58.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.58.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.59.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.59.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.6.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.6.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.60.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.60.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.61.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.61.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.62.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.62.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.63.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.63.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.64.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.64.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.65.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.65.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.66.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.66.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.67.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.67.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.68.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.68.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.69.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.69.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.7.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.7.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.70.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.70.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.71.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.71.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.72.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.72.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.73.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.73.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.74.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.74.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.75.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.75.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.76.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.76.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.77.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.77.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.78.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.78.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.79.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.79.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.8.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.8.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.80.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.80.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.81.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.81.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.82.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.82.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.83.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.83.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.84.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.84.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.85.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.85.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.86.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.86.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.87.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.87.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.88.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.88.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.89.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.89.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.9.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.9.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.90.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.90.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.91.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.91.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.92.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.92.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.93.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.93.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.94.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.94.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.95.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.95.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.96.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.96.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.97.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.97.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.98.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.98.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.99.down_proj.weight": "model-00041-of-00049.safetensors",
+ "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.experts.99.up_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.mlp.gate.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.self_attn.k_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.self_attn.o_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.self_attn.q_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.41.self_attn.v_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.input_layernorm.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.0.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.0.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.1.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.1.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.10.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.10.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.100.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.100.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.101.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.101.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.102.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.102.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.103.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.103.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.104.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.104.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.105.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.105.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.106.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.106.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.107.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.107.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.108.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.108.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.109.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.109.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.11.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.11.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.110.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.110.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.111.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.111.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.112.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.112.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.113.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.113.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.114.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.114.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.115.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.115.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.116.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.116.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.117.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.117.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.118.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.118.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.119.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.119.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.12.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.12.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.120.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.120.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.121.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.121.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.122.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.122.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.123.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.123.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.124.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.124.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.125.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.125.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.126.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.126.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.127.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.127.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.13.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.13.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.14.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.14.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.15.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.15.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.16.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.16.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.17.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.17.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.18.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.18.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.19.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.19.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.2.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.2.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.20.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.20.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.21.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.21.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.22.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.22.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.23.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.23.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.24.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.24.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.25.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.25.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.26.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.26.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.27.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.27.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.28.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.28.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.29.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.29.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.3.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.3.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.30.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.30.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.31.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.31.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.32.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.32.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.33.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.33.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.34.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.34.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.35.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.35.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.36.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.36.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.37.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.37.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.38.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.38.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.39.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.39.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.4.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.4.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.40.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.40.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.41.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.41.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.42.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.42.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.43.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.43.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.44.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.44.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.45.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.45.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.46.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.46.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.47.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.47.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.48.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.48.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.49.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.49.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.5.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.5.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.50.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.50.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.51.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.51.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.52.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.52.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.53.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.53.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.54.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.54.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.55.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.55.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.56.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.56.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.57.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.57.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.58.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.58.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.59.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.59.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.6.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.6.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.60.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.60.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.61.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.61.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.62.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.62.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.63.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.63.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.64.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.64.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.65.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.65.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.66.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.66.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.67.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.67.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.68.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.68.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.69.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.69.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.7.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.7.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.70.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.70.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.71.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.71.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.72.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.72.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.73.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.73.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.74.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.74.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.75.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.75.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.76.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.76.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.77.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.77.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.78.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.78.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.79.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.79.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.8.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.8.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.80.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.80.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.81.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.81.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.82.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.82.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.83.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.83.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.84.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.84.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.85.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.85.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.86.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.86.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.87.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.87.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.88.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.88.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.89.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.89.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.9.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.9.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.90.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.90.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.91.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.91.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.92.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.92.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.93.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.93.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.94.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.94.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.95.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.95.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.96.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.96.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.97.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.97.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.98.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.98.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.99.down_proj.weight": "model-00042-of-00049.safetensors",
+ "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.experts.99.up_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.mlp.gate.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.self_attn.k_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.self_attn.o_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.self_attn.q_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.42.self_attn.v_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.input_layernorm.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.0.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.0.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.1.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.1.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.10.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.10.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.100.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.100.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.101.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.101.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.102.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.102.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.103.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.103.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.104.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.104.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.105.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.105.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.106.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.106.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.107.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.107.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.108.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.108.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.109.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.109.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.11.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.11.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.110.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.110.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.111.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.111.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.112.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.112.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.113.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.113.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.114.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.114.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.115.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.115.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.116.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.116.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.117.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.117.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.118.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.118.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.119.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.119.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.12.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.12.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.120.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.120.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.121.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.121.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.122.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.122.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.123.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.123.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.124.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.124.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.125.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.125.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.126.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.126.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.127.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.127.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.13.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.13.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.14.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.14.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.15.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.15.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.16.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.16.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.17.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.17.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.18.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.18.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.19.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.19.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.2.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.2.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.20.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.20.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.21.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.21.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.22.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.22.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.23.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.23.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.24.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.24.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.25.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.25.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.26.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.26.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.27.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.27.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.28.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.28.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.29.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.29.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.3.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.3.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.30.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.30.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.31.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.31.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.32.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.32.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.33.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.33.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.34.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.34.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.35.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.35.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.36.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.36.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.37.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.37.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.38.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.38.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.39.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.39.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.4.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.4.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.40.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.40.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.41.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.41.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.42.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.42.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.43.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.43.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.44.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.44.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.45.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.45.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.46.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.46.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.47.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.47.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.48.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.48.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.49.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.49.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.5.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.5.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.50.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.50.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.51.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.51.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.52.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.52.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.53.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.53.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.54.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.54.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.55.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.55.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.56.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.56.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.57.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.57.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.58.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.58.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.59.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.59.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.6.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.6.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.60.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.60.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.61.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.61.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.62.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.62.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.63.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.63.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.64.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.64.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.65.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.65.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.66.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.66.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.67.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.67.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.68.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.68.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.69.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.69.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.7.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.7.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.70.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.70.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.71.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.71.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.72.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.72.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.73.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.73.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.74.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.74.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.75.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.75.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.76.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.76.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.77.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.77.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.78.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.78.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.79.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.79.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.8.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.8.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.80.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.80.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.81.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.81.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.82.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.82.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.83.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.83.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.84.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.84.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.85.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.85.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.86.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.86.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.87.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.87.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.88.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.88.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.89.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.89.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.9.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.9.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.90.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.90.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.91.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.91.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.92.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.92.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.93.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.93.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.94.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.94.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.95.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.95.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.96.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.96.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.97.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.97.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.98.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.98.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.99.down_proj.weight": "model-00043-of-00049.safetensors",
+ "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.experts.99.up_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.mlp.gate.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.self_attn.k_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.self_attn.o_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.self_attn.q_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.43.self_attn.v_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.input_layernorm.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.0.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.0.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.1.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.1.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.10.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.10.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.100.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.100.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.101.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.101.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.102.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.102.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.103.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.103.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.104.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.104.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.105.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.105.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.106.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.106.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.107.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.107.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.108.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.108.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.109.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.109.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.11.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.11.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.110.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.110.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.111.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.111.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.112.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.112.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.113.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.113.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.114.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.114.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.115.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.115.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.116.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.116.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.117.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.117.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.118.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.118.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.119.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.119.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.12.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.12.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.120.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.120.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.121.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.121.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.122.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.122.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.123.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.123.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.124.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.124.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.125.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.125.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.126.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.126.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.127.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.127.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.13.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.13.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.14.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.14.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.15.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.15.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.16.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.16.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.17.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.17.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.18.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.18.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.19.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.19.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.2.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.2.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.20.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.20.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.21.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.21.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.22.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.22.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.23.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.23.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.24.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.24.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.25.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.25.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.26.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.26.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.27.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.27.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.28.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.28.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.29.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.29.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.3.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.3.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.30.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.30.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.31.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.31.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.32.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.32.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.33.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.33.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.34.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.34.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.35.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.35.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.36.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.36.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.37.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.37.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.38.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.38.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.39.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.39.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.4.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.4.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.40.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.40.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.41.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.41.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.42.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.42.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.43.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.43.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.44.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.44.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.45.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.45.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.46.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.46.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.47.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.47.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.48.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.48.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.49.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.49.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.5.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.5.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.50.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.50.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.51.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.51.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.52.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.52.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.53.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.53.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.54.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.54.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.55.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.55.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.56.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.56.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.57.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.57.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.58.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.58.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.59.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.59.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.6.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.6.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.60.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.60.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.61.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.61.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.62.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.62.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.63.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.63.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.64.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.64.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.65.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.65.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.66.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.66.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.67.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.67.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.68.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.68.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.69.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.69.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.7.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.7.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.70.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.70.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.71.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.71.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.72.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.72.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.73.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.73.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.74.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.74.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.75.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.75.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.76.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.76.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.77.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.77.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.78.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.78.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.79.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.79.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.8.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.8.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.80.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.80.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.81.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.81.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.82.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.82.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.83.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.83.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.84.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.84.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.85.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.85.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.86.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.86.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.87.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.87.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.88.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.88.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.89.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.89.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.9.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.9.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.90.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.90.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.91.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.91.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.92.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.92.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.93.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.93.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.94.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.94.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.95.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.95.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.96.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.96.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.97.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.97.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.98.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.98.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.99.down_proj.weight": "model-00044-of-00049.safetensors",
+ "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.experts.99.up_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.mlp.gate.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.self_attn.k_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.self_attn.o_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.self_attn.q_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.44.self_attn.v_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.input_layernorm.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.0.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.0.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.1.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.1.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.10.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.10.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.100.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.100.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.101.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.101.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.102.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.102.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.103.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.103.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.104.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.104.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.105.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.105.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.106.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.106.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.107.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.107.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.108.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.108.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.109.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.109.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.11.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.11.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.110.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.110.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.111.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.111.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.112.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.112.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.113.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.113.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.114.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.114.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.115.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.115.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.116.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.116.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.117.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.117.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.118.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.118.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.119.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.119.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.12.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.12.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.120.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.120.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.121.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.121.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.122.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.122.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.123.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.123.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.124.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.124.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.125.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.125.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.126.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.126.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.127.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.127.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.13.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.13.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.14.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.14.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.15.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.15.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.16.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.16.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.17.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.17.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.18.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.18.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.19.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.19.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.2.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.2.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.20.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.20.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.21.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.21.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.22.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.22.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.23.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.23.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.24.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.24.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.25.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.25.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.26.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.26.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.27.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.27.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.28.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.28.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.29.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.29.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.3.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.3.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.30.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.30.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.31.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.31.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.32.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.32.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.33.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.33.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.34.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.34.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.35.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.35.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.36.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.36.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.37.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.37.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.38.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.38.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.39.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.39.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.4.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.4.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.40.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.40.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.41.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.41.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.42.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.42.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.43.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.43.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.44.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.44.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.45.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.45.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.46.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.46.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.47.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.47.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.48.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.48.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.49.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.49.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.5.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.5.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.50.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.50.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.51.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.51.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.52.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.52.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.53.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.53.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.54.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.54.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.55.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.55.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.56.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.56.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.57.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.57.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.58.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.58.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.59.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.59.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.6.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.6.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.60.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.60.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.61.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.61.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.62.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.62.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.63.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.63.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.64.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.64.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.65.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.65.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.66.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.66.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.67.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.67.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.68.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.68.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.69.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.69.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.7.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.7.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.70.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.70.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.71.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.71.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.72.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.72.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.73.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.73.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.74.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.74.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.75.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.75.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.76.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.76.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.77.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.77.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.78.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.78.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.79.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.79.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.8.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.8.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.80.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.80.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.81.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.81.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.82.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.82.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.83.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.83.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.84.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.84.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.85.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.85.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.86.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.86.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.87.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.87.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.88.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.88.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.89.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.89.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.9.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.9.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.90.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.90.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.91.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.91.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.92.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.92.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.93.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.93.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.94.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.94.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.95.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.95.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.96.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.96.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.97.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.97.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.98.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.98.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.99.down_proj.weight": "model-00045-of-00049.safetensors",
+ "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.experts.99.up_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.mlp.gate.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.self_attn.k_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.self_attn.o_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.self_attn.q_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.45.self_attn.v_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.input_layernorm.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.0.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.0.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.1.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.1.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.10.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.10.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.100.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.100.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.101.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.101.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.102.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.102.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.103.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.103.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.104.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.104.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.105.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.105.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.106.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.106.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.107.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.107.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.108.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.108.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.109.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.109.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.11.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.11.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.110.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.110.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.111.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.111.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.112.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.112.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.113.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.113.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.114.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.114.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.115.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.115.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.116.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.116.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.117.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.117.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.118.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.118.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.119.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.119.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.12.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.12.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.120.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.120.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.121.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.121.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.122.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.122.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.123.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.123.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.124.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.124.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.125.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.125.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.126.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.126.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.127.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.127.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.13.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.13.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.14.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.14.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.15.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.15.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.16.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.16.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.17.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.17.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.18.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.18.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.19.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.19.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.2.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.2.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.20.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.20.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.21.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.21.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.22.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.22.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.23.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.23.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.24.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.24.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.25.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.25.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.26.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.26.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.27.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.27.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.28.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.28.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.29.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.29.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.3.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.3.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.30.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.30.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.31.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.31.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.32.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.32.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.33.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.33.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.34.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.34.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.35.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.35.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.36.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.36.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.37.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.37.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.38.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.38.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.39.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.39.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.4.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.4.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.40.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.40.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.41.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.41.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.42.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.42.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.43.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.43.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.44.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.44.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.45.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.45.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.46.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.46.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.47.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.47.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.48.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.48.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.49.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.49.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.5.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.5.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.50.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.50.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.51.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.51.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.52.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.52.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.53.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.53.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.54.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.54.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.55.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.55.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.56.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.56.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.57.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.57.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.58.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.58.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.59.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.59.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.6.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.6.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.60.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.60.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.61.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.61.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.62.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.62.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.63.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.63.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.64.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.64.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.65.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.65.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.66.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.66.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.67.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.67.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.68.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.68.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.69.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.69.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.7.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.7.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.70.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.70.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.71.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.71.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.72.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.72.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.73.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.73.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.74.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.74.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.75.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.75.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.76.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.76.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.77.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.77.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.78.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.78.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.79.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.79.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.8.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.8.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.80.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.80.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.81.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.81.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.82.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.82.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.83.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.83.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.84.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.84.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.85.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.85.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.86.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.86.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.87.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.87.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.88.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.88.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.89.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.89.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.9.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.9.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.90.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.90.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.91.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.91.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.92.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.92.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.93.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.93.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.94.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.94.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.95.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.95.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.96.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.96.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.97.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.97.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.98.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.98.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.99.down_proj.weight": "model-00046-of-00049.safetensors",
+ "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.experts.99.up_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.mlp.gate.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.self_attn.k_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.self_attn.o_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.self_attn.q_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.46.self_attn.v_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.input_layernorm.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.0.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.0.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.1.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.1.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.10.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.10.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.100.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.100.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.101.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.101.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.102.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.102.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.103.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.103.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.104.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.104.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.105.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.105.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.106.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.106.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.107.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.107.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.108.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.108.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.109.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.109.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.11.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.11.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.110.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.110.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.111.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.111.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.112.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.112.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.113.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.113.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.114.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.114.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.115.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.115.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.116.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.116.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.117.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.117.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.118.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.118.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.119.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.119.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.12.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.12.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.120.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.120.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.121.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.121.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.122.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.122.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.123.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.123.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.124.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.124.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.125.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.125.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.126.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.126.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.127.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.127.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.13.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.13.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.14.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.14.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.15.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.15.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.16.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.16.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.17.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.17.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.18.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.18.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.19.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.19.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.2.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.2.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.20.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.20.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.21.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.21.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.22.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.22.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.23.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.23.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.24.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.24.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.25.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.25.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.26.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.26.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.27.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.27.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.28.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.28.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.29.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.29.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.3.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.3.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.30.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.30.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.31.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.31.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.32.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.32.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.33.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.33.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.34.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.34.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.35.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.35.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.36.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.36.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.37.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.37.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.38.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.38.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.39.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.39.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.4.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.4.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.40.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.40.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.41.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.41.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.42.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.42.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.43.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.43.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.44.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.44.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.45.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.45.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.46.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.46.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.47.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.47.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.48.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.48.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.49.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.49.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.5.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.5.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.50.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.50.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.51.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.51.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.52.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.52.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.53.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.53.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.54.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.54.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.55.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.55.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.56.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.56.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.57.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.57.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.58.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.58.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.59.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.59.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.6.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.6.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.60.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.60.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.61.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.61.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.62.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.62.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.63.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.63.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.64.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.64.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.65.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.65.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.66.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.66.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.67.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.67.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.68.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.68.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.69.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.69.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.7.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.7.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.70.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.70.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.71.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.71.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.72.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.72.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.73.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.73.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.74.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.74.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.75.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.75.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.76.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.76.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.77.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.77.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.78.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.78.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.79.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.79.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.8.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.8.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.80.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.80.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.81.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.81.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.82.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.82.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.83.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.83.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.84.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.84.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.85.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.85.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.86.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.86.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.87.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.87.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.88.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.88.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.89.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.89.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.9.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.9.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.90.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.90.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.91.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.91.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.92.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.92.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.93.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.93.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.94.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.94.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.95.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.95.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.96.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.96.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.97.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.97.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.98.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.98.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.99.down_proj.weight": "model-00047-of-00049.safetensors",
+ "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.experts.99.up_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.mlp.gate.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.self_attn.k_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.self_attn.o_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.self_attn.q_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.47.self_attn.v_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.input_layernorm.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.0.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.0.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.1.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.1.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.10.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.10.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.100.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.100.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.101.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.101.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.102.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.102.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.103.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.103.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.104.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.104.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.105.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.105.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.106.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.106.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.107.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.107.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.108.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.108.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.109.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.109.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.11.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.11.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.110.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.110.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.111.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.111.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.112.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.112.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.113.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.113.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.114.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.114.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.115.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.115.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.116.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.116.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.117.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.117.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.118.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.118.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.119.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.119.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.12.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.12.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.120.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.120.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.121.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.121.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.122.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.122.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.123.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.123.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.124.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.124.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.125.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.125.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.126.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.126.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.127.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.127.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.13.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.13.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.14.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.14.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.15.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.15.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.16.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.16.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.17.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.17.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.18.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.18.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.19.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.19.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.2.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.2.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.20.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.20.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.21.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.21.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.22.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.22.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.23.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.23.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.24.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.24.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.25.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.25.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.26.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.26.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.27.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.27.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.28.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.28.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.29.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.29.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.3.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.3.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.30.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.30.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.31.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.31.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.32.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.32.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.33.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.33.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.34.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.34.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.35.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.35.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.36.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.36.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.37.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.37.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.38.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.38.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.39.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.39.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.4.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.4.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.40.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.40.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.41.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.41.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.42.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.42.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.43.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.43.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.44.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.44.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.45.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.45.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.46.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.46.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.47.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.47.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.48.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.48.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.49.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.49.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.5.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.5.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.50.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.50.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.51.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.51.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.52.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.52.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.53.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.53.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.54.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.54.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.55.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.55.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.56.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.56.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.57.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.57.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.58.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.58.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.59.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.59.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.6.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.6.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.60.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.60.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.61.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.61.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.62.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.62.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.63.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.63.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.64.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.64.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.65.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.65.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.66.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.66.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.67.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.67.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.68.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.68.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.69.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.69.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.7.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.7.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.70.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.70.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.71.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.71.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.72.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.72.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.73.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.73.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.74.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.74.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.75.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.75.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.76.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.76.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.77.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.77.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.78.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.78.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.79.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.79.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.8.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.8.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.80.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.80.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.81.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.81.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.82.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.82.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.83.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.83.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.84.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.84.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.85.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.85.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.86.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.86.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.87.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.87.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.88.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.88.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.89.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.89.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.9.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.9.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.90.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.90.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.91.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.91.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.92.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.92.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.93.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.93.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.94.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.94.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.95.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.95.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.96.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.96.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.97.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.97.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.98.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.98.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.99.down_proj.weight": "model-00048-of-00049.safetensors",
+ "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.experts.99.up_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.mlp.gate.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.self_attn.k_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.self_attn.o_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.self_attn.q_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.48.self_attn.v_proj.weight": "model-00049-of-00049.safetensors",
+ "model.layers.5.input_layernorm.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.0.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.0.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.1.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.1.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.10.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.10.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.100.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.100.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.101.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.101.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.102.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.102.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.103.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.103.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.104.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.104.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.105.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.105.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.106.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.106.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.107.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.107.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.108.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.108.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.109.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.109.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.11.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.11.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.110.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.110.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.111.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.111.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.112.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.112.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.113.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.113.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.114.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.114.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.115.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.116.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.117.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.118.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.119.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.12.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.12.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.120.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.121.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.122.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.123.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.124.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.125.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.125.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.126.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.127.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.13.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.13.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.14.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.14.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.15.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.15.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.16.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.16.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.17.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.17.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.18.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.18.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.19.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.19.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.2.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.2.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.20.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.20.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.21.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.21.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.22.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.22.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.23.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.23.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.24.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.24.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.25.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.25.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.26.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.26.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.27.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.27.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.28.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.28.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.29.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.29.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.3.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.3.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.30.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.30.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.31.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.31.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.32.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.32.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.33.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.33.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.34.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.34.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.35.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.35.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.36.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.36.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.37.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.37.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.38.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.38.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.39.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.39.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.4.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.4.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.40.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.40.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.41.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.41.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.42.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.42.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.43.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.43.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.44.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.44.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.45.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.45.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.46.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.46.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.47.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.47.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.48.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.48.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.49.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.49.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.5.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.5.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.50.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.50.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.51.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.51.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.52.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.52.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.53.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.53.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.54.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.54.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.55.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.55.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.56.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.56.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.57.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.57.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.58.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.58.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.59.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.59.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.6.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.6.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.60.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.60.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.61.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.61.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.62.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.62.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.63.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.63.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.64.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.64.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.65.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.65.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.66.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.66.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.67.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.67.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.68.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.68.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.69.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.69.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.7.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.7.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.70.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.70.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.71.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.71.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.72.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.72.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.73.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.73.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.74.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.74.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.75.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.75.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.76.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.76.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.77.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.77.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.78.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.78.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.79.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.79.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.8.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.8.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.80.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.80.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.81.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.81.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.82.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.82.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.83.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.83.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.84.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.84.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.85.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.85.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.86.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.86.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.87.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.87.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.88.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.88.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.89.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.89.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.9.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.9.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.90.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.90.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.91.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.91.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.92.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.92.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.93.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.93.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.94.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.94.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.95.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.95.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.96.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.96.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.97.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.97.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.98.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.98.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.99.down_proj.weight": "model-00005-of-00049.safetensors",
+ "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.experts.99.up_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.mlp.gate.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.self_attn.k_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.self_attn.o_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.self_attn.q_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.5.self_attn.v_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.input_layernorm.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.0.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.0.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.1.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.1.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.10.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.10.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.100.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.101.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.102.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.103.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.104.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.105.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.106.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.107.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.108.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.109.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.109.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.11.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.11.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.110.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.111.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.112.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.113.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.114.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.115.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.116.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.117.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.118.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.119.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.12.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.12.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.120.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.121.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.122.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.123.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.124.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.125.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.125.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.126.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.127.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.13.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.13.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.14.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.14.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.15.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.15.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.16.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.16.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.17.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.17.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.18.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.18.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.19.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.19.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.2.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.2.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.20.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.20.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.21.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.21.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.22.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.22.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.23.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.23.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.24.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.24.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.25.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.25.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.26.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.26.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.27.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.27.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.28.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.28.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.29.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.29.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.3.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.3.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.30.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.30.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.31.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.31.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.32.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.32.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.33.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.33.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.34.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.34.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.35.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.35.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.36.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.36.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.37.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.37.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.38.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.38.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.39.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.39.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.4.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.4.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.40.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.40.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.41.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.41.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.42.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.42.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.43.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.43.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.44.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.44.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.45.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.45.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.46.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.46.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.47.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.47.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.48.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.48.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.49.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.49.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.5.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.5.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.50.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.50.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.51.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.51.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.52.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.52.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.53.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.53.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.54.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.55.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.56.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.57.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.58.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.59.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.6.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.6.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.60.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.61.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.62.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.63.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.64.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.65.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.66.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.67.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.68.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.69.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.7.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.7.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.70.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.71.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.72.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.73.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.74.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.75.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.76.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.77.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.78.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.79.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.8.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.8.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.80.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.81.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.82.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.83.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.84.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.85.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.86.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.87.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.88.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.89.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.9.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.9.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.90.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.91.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.92.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.93.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.94.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.95.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.96.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.97.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.98.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.99.down_proj.weight": "model-00006-of-00049.safetensors",
+ "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.mlp.gate.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.self_attn.k_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.self_attn.o_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.self_attn.q_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.6.self_attn.v_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.input_layernorm.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.0.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.1.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.10.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.100.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.100.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.101.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.101.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.102.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.102.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.103.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.103.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.104.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.104.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.105.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.105.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.106.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.106.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.107.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.107.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.108.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.108.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.109.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.109.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.11.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.110.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.110.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.111.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.111.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.112.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.112.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.113.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.113.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.114.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.114.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.115.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.115.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.116.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.116.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.117.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.117.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.118.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.118.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.119.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.119.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.12.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.120.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.120.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.121.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.121.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.122.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.122.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.123.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.123.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.124.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.124.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.125.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.125.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.126.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.126.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.127.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.127.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.13.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.14.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.15.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.16.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.17.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.18.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.19.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.2.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.20.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.21.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.22.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.23.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.24.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.25.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.26.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.27.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.28.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.29.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.3.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.30.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.31.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.32.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.33.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.34.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.35.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.36.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.37.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.38.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.39.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.4.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.40.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.41.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.42.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.43.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.44.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.45.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.46.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.47.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.48.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.49.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.5.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.50.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.51.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.52.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.53.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.54.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.55.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.56.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.57.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.58.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.59.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.6.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.60.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.61.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.62.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.64.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.65.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.66.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.67.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.68.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.69.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.70.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.71.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.72.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.73.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.74.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.75.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.76.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.77.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.78.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.79.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.8.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.80.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.81.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.82.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.83.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.84.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.85.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.86.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.87.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.88.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.89.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.9.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.90.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.91.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.92.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.93.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.94.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.95.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.96.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.97.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.98.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.99.down_proj.weight": "model-00007-of-00049.safetensors",
+ "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.experts.99.up_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.mlp.gate.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.input_layernorm.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.0.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.1.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.10.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.100.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.100.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.101.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.101.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.102.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.102.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.103.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.103.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.104.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.104.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.105.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.105.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.106.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.106.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.107.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.107.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.108.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.108.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.109.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.109.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.11.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.110.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.110.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.111.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.111.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.112.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.112.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.113.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.113.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.114.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.114.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.115.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.115.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.116.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.116.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.117.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.117.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.118.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.118.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.119.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.119.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.12.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.120.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.120.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.121.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.121.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.122.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.122.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.123.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.123.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.124.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.124.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.125.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.125.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.126.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.126.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.127.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.127.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.13.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.14.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.15.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.16.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.17.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.18.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.19.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.2.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.20.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.21.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.22.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.23.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.24.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.25.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.26.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.27.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.28.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.29.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.3.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.30.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.31.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.32.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.33.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.34.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.35.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.36.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.37.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.38.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.38.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.39.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.39.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.4.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.40.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.40.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.41.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.41.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.42.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.42.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.43.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.43.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.44.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.44.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.45.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.45.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.46.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.46.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.47.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.47.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.48.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.48.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.49.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.49.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.5.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.50.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.50.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.51.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.51.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.52.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.52.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.53.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.53.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.54.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.54.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.55.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.55.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.56.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.56.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.57.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.57.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.58.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.58.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.59.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.59.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.6.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.60.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.60.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.61.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.61.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.62.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.62.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.63.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.63.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.64.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.64.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.65.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.65.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.66.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.66.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.67.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.67.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.68.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.68.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.69.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.69.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.7.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.70.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.70.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.71.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.71.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.72.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.72.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.73.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.73.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.74.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.74.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.75.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.75.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.76.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.76.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.77.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.77.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.78.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.78.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.79.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.79.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.8.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.80.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.80.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.81.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.81.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.82.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.82.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.83.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.83.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.84.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.84.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.85.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.85.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.86.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.86.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.87.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.87.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.88.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.88.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.89.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.89.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.9.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.90.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.90.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.91.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.91.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.92.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.92.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.93.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.93.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.94.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.94.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.95.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.95.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.96.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.96.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.97.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.97.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.98.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.98.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.99.down_proj.weight": "model-00008-of-00049.safetensors",
+ "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.experts.99.up_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.mlp.gate.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.input_layernorm.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.0.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.0.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.1.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.1.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.10.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.10.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.100.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.100.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.101.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.101.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.102.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.102.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.103.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.103.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.104.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.104.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.105.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.105.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.106.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.106.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.107.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.107.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.108.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.108.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.109.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.109.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.11.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.11.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.110.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.110.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.111.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.111.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.112.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.112.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.113.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.113.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.114.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.114.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.115.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.115.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.116.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.116.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.117.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.117.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.118.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.118.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.119.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.119.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.12.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.12.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.120.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.120.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.121.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.121.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.122.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.122.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.123.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.123.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.124.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.124.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.125.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.125.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.126.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.126.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.127.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.127.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.13.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.13.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.14.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.14.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.15.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.15.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.16.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.16.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.17.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.17.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.18.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.18.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.19.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.19.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.2.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.2.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.20.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.20.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.21.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.21.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.22.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.22.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.23.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.23.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.24.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.24.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.25.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.25.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.26.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.26.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.27.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.27.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.28.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.28.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.29.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.29.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.3.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.3.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.30.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.30.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.31.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.31.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.32.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.32.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.33.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.33.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.34.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.34.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.35.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.35.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.36.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.36.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.37.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.37.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.38.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.38.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.39.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.39.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.4.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.4.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.40.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.40.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.41.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.41.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.42.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.42.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.43.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.43.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.44.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.44.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.45.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.45.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.46.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.46.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.47.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.47.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.48.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.48.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.49.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.49.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.5.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.5.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.50.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.50.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.51.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.51.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.52.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.52.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.53.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.53.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.54.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.54.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.55.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.55.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.56.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.56.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.57.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.57.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.58.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.58.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.59.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.59.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.6.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.6.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.60.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.60.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.61.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.61.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.62.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.62.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.63.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.63.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.64.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.64.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.65.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.65.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.66.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.66.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.67.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.67.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.68.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.68.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.69.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.69.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.7.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.7.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.70.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.70.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.71.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.71.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.72.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.72.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.73.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.73.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.74.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.74.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.75.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.75.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.76.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.76.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.77.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.77.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.78.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.78.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.79.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.79.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.8.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.8.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.80.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.80.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.81.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.81.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.82.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.82.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.83.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.83.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.84.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.84.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.85.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.85.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.86.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.86.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.87.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.87.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.88.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.88.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.89.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.89.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.9.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.9.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.90.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.90.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.91.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.91.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.92.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.92.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.93.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.93.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.94.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.94.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.95.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.95.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.96.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.96.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.97.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.97.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.98.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.98.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.99.down_proj.weight": "model-00009-of-00049.safetensors",
+ "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.experts.99.up_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.mlp.gate.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.self_attn.k_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.self_attn.o_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.self_attn.q_proj.weight": "model-00010-of-00049.safetensors",
+ "model.layers.9.self_attn.v_proj.weight": "model-00010-of-00049.safetensors",
+ "model.norm.weight": "model-00049-of-00049.safetensors"
+ }
+}
diff --git a/special_tokens_map.json b/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..7d90b1a7abc0c8c5e3da8c11d6aab610a7a8dea0
--- /dev/null
+++ b/special_tokens_map.json
@@ -0,0 +1,30 @@
+{
+ "bos_token": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "eos_token": {
+ "content": "<|END_OF_TURN_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "unk_token": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+}
\ No newline at end of file
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..a8680c4bce4114a529aaa37430b3af664ce2b7ef
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a17e995a435e5ddc664625bc76b760d8da5301f6e17d6eefdac2d6605685796a
+size 28217461
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..04d772a5bfd8e0dc6f7e701ea0fbaa7a3b80eba0
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,328 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "add_prefix_space": false,
+ "clean_up_tokenization_spaces": false,
+ "legacy": true,
+ "spaces_between_special_tokens": false,
+ "use_default_system_prompt": false,
+ "bos_token": "",
+ "eos_token": "<|END_OF_TURN_TOKEN|>",
+ "pad_token": "",
+ "unk_token": "",
+ "tokenizer_class": "TokenizersBackend",
+ "model_max_length": 1000000000000000019884624838656,
+ "sp_model_kwargs": {},
+ "chat_template": [
+ {
+ "name": "default",
+ "template": "{{ bos_token }}{% if documents %}\n{% set tools = [] %}\n{%- macro document_turn(documents) -%}\n{# format documents into chat turn #}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|><|START_THINKING|>I will look through the document to address the users needs.<|END_THINKING|><|START_ACTION|>[\n {\"tool_call_id\": \"0\", \"tool_name\": \"direct-injected-document\", \"parameters\": {}}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|><|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n {\n \"tool_call_id\": \"0\",\n \"results\": {\n{% for doc in documents %}\n \"{{ loop.index0 }}\": {{doc|tojson}}{% if not loop.last %},\n {% endif %}\n{% endfor %}\n\n },\n \"is_error\": null\n }\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>{%- endmacro %}\n{%- macro tool_call_id_to_int(messages, tool_call_id) %}\n{%- set counter = namespace(value=0) %}\n{%- set tool_call_id_seen = namespace(value=false) %}\n{%- for msg in messages %}\n {%- if msg.tool_calls %}\n {%- for tool_call in msg.tool_calls %}\n {%- if tool_call.id == tool_call_id and not tool_call_id_seen.value -%}\n {{ counter.value }}\n {%- set tool_call_id_seen.value = true %}\n {%- endif %}\n {%- set counter.value = counter.value + 1 %}\n {%- endfor %}\n {%- endif %}\n{%- endfor %}\n{%- endmacro %}\n{%- macro format_tool_message(messages, tool_msg) -%}\n{# format tool message #}\n {\n \"tool_call_id\": \"{{ tool_call_id_to_int(messages, tool_msg.tool_call_id) }}\",\n \"results\": {\n \"0\": {{ tool_msg.content|tojson }}\n },\n \"is_error\": null\n }\n{%- endmacro -%}\n{%- if messages and messages[0]['role']|lower == 'system' %}{%- set developer_preamble = messages[0]['content'] %}{% endif %}\n{%- set tool_idx = namespace(value=0) %}\n{%- set tool_ids_seen = namespace(value=[]) %}\n{%- set sent_documents = namespace(value=false) %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|># System Preamble\nYou are in contextual safety mode. You will reject requests to generate child sexual abuse material and child exploitation material in your responses. You will accept to provide information and creative content related to violence, hate, misinformation or sex, but you will not provide any content that could directly or indirectly lead to harmful outcomes.\n\nYour information cutoff date is June 2024.\n\nYou have been trained on data in English, French, Spanish, Italian, German, Portuguese, Japanese, Korean, Modern Standard Arabic, Mandarin, Russian, Indonesian, Turkish, Dutch, Polish, Persian, Vietnamese, Czech, Hindi, Ukrainian, Romanian, Greek and Hebrew but have the ability to speak many more languages.\n{% if tools or documents %}\n\nYou have been trained to have advanced reasoning and tool-use capabilities and you should make best use of these skills to serve user's requests.\n\n## Tool Use\nThink about how you can make best use of the provided tools to help with the task and come up with a high level plan that you will execute first.\n\n0. Start by writing <|START_THINKING|> followed by a detailed step by step plan of how you will solve the problem. For each step explain your thinking fully and give details of required tool calls (if needed). Unless specified otherwise, you write your plan in natural language. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when the user request is so straightforward to address that only a trivial plan would be needed.\n NOTE: You MUST skip this step when you are directly responding to the user's request without using any tools.\n\nThen carry out your plan by repeatedly executing the following steps.\n1. Action: write <|START_ACTION|> followed by a list of JSON-formatted tool calls, with each one containing \"tool_name\" and \"parameters\" fields.\n When there are multiple tool calls which are completely independent of each other (i.e. they can be executed in parallel), you should list them out all together in one step. When you finish, close it out with <|END_ACTION|>.\n2. Observation: you will then receive results of those tool calls in JSON format in the very next turn, wrapped around by <|START_TOOL_RESULT|> and <|END_TOOL_RESULT|>. Carefully observe those results and think about what to do next. Note that these results will be provided to you in a separate turn. NEVER hallucinate results.\n Every tool call produces a list of results (when a tool call produces no result or a single result, it'll still get wrapped inside a list). Each result is clearly linked to its originating tool call via its \"tool_call_id\".\n3. Reflection: start the next turn by writing <|START_THINKING|> followed by what you've figured out so far, any changes you need to make to your plan, and what you will do next. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when everything is going according to plan and no special pieces of information or reasoning chains need to be recorded.\n NOTE: You MUST skip this step when you are done with tool-use actions and are ready to respond to the user.\n\nYou can repeat the above 3 steps multiple times (could be 0 times too if no suitable tool calls are available or needed), until you decide it's time to finally respond to the user.\n\n4. Response: then break out of the loop and write <|START_RESPONSE|> followed by a piece of text which serves as a response to the user's last request. Use all previous tool calls and results to help you when formulating your response. When you finish, close it out with <|END_RESPONSE|>.\n{% if enable_citations %}\n\n## Grounding\nImportantly, note that \"Reflection\" and \"Response\" above can be grounded.\nGrounding means you associate pieces of texts (called \"spans\") with those specific tool results that support them (called \"sources\"). And you use a pair of tags \"\" and \"\" to indicate when a span can be grounded onto a list of sources, listing them out in the closing tag. Sources from the same tool call are grouped together and listed as \"{tool_call_id}:[{list of result indices}]\", before they are joined together by \",\". E.g., \"span\" means that \"span\" is supported by result 1 and 2 from \"tool_call_id=0\" as well as result 0 from \"tool_call_id=1\".\n{% endif %}\n\n## Available Tools\nHere is the list of tools that you have available to you.\nYou can ONLY use the tools listed here. When a tool is not listed below, it is NOT available and you should NEVER attempt to use it.\nEach tool is represented as a JSON object with fields like \"name\", \"description\", \"parameters\" (per JSON Schema), and optionally, \"responses\" (per JSON Schema).\n\n```json\n[\n{% if documents %}\n {\"name\": \"direct-injected-document\", \"description\": \"This is a special tool to directly inject user-uploaded documents into the chat as additional context. DO NOT use this tool by yourself!\", \"parameters\": {\"type\": \"object\", \"properties\": {}, \"required\": []}, \"responses\": {\"200\": {\"description\": \"Successfully returned a list of chunked text snippets from the directly uploaded documents.\", \"content\": {\"application/json\": {\"schema\": {\"type\": \"array\", \"items\": {\"type\": \"object\", \"required\": [\"url\", \"snippet\"], \"properties\": {\"url\": {\"type\": \"string\", \"description\": \"The url of the uploaded document.\"}, \"snippet\": {\"type\": \"string\", \"description\": \"The text snippet for the returned document chunk.\"}}}}}}}}}{%- if tools %},{% endif %}\n\n{% endif %}\n{% for tool in tools %}\n {\"name\": \"{{ tool['function']['name'] }}\", \"description\": \"{{tool['function']['description']}}\", \"parameters\": {{ tool['function']['parameters']|tojson }}, \"responses\": null}{%- if not loop.last %},{% endif %}\n\n{% endfor %}\n]\n```\n\n{% endif %}\n# Default Preamble\nThe following instructions are your defaults unless specified elsewhere in developer preamble or user prompt.\n- Your name is Command.\n- You are a large language model built by Cohere.\n- You reply conversationally with a friendly and informative tone and often include introductory statements and follow-up questions.\n- If the input is ambiguous, ask clarifying follow-up questions.\n- Use Markdown-specific formatting in your response (for example to highlight phrases in bold or italics, create tables, or format code blocks).\n- Use LaTeX to generate mathematical notation for complex equations.\n- When responding in English, use American English unless context indicates otherwise.\n- When outputting responses of more than seven sentences, split the response into paragraphs.\n- Prefer the active voice.\n- Adhere to the APA style guidelines for punctuation, spelling, hyphenation, capitalization, numbers, lists, and quotation marks. Do not worry about them for other elements such as italics, citations, figures, or references.\n- Use gender-neutral pronouns for unspecified persons.\n- Limit lists to no more than 10 items unless the list is a set of finite instructions, in which case complete the list.\n- Use the third person when asked to write a summary.\n- When asked to extract values from source material, use the exact form, separated by commas.\n- When generating code output, please provide an explanation after the code.\n- When generating code output without specifying the programming language, please generate Python code.\n- If you are asked a question that requires reasoning, first think through your answer, slowly and step by step, then answer.\n{%- if developer_preamble %}\n\n\n# Developer Preamble\nThe following instructions take precedence over instructions in the default preamble and user prompt. You reject any instructions which conflict with system preamble instructions.\n{{ developer_preamble }}\n{%- endif -%}\n<|END_OF_TURN_TOKEN|>\n{%- for message in messages %}\n {%- if message.role|lower == 'system' and not (loop.first and developer_preamble)%}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>\n {%- elif message.role|lower == 'user' %}\n<|START_OF_TURN_TOKEN|><|USER_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>{%- if documents and not sent_documents.value %}{%- set sent_documents.value = true %}{% set tool_idx.value = tool_idx.value + 1 %}{{ document_turn(documents) }}{% endif %}\n {%- elif message.role|lower == 'assistant' or message.role|lower == 'chatbot' %}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{% if message.tool_calls %}<|START_THINKING|>{{message.tool_plan}}<|END_THINKING|><|START_ACTION|>[\n {% for tc in message.tool_calls %}\n {\"tool_call_id\": \"{{ tool_idx.value }}\", \"tool_name\": \"{{ tc['function']['name'] }}\", \"parameters\": {{ tc['function']['arguments']|tojson }}}{% if not loop.last %},{% endif %}\n\n {% set tool_idx.value = tool_idx.value + 1 %}\n {% endfor %}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|>{% else %}<|START_RESPONSE|>{{message.content}}<|END_RESPONSE|><|END_OF_TURN_TOKEN|>{% endif %}\n {% elif message.role|lower == 'tool' and message.tool_call_id not in tool_ids_seen.value %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n{{ format_tool_message(messages, message) }}\n {%- for msg in messages[loop.index0 + 1:] %}\n {%- if msg.role|lower == 'tool' %},\n{{ format_tool_message(messages, msg) }}\n {%- set tool_ids_seen.value = tool_ids_seen.value + [msg.tool_call_id] %}\n {%- else %}\n {%- break %}\n {%- endif %}\n {%- endfor %}\n\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>\n {%- endif %}\n{%- endfor %}<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>\n{%- else -%}\n{%- if messages and messages[0]['role']|lower == 'system' %}{%- set developer_preamble = messages[0]['content'] %}{% endif %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|># System Preamble\n{% if safety_mode|upper == 'STRICT' -%}\nYou are in strict safety mode. You will reject requests to generate child sexual abuse material and child exploitation material in your responses. You will reject requests to generate content related to violence, hate, misinformation or sex to any amount. You will avoid using profanity. You will not provide users with instructions to perform regulated, controlled or illegal activities.\n{%- else -%}\nYou are in contextual safety mode. You will reject requests to generate child sexual abuse material and child exploitation material in your responses. You will accept to provide information and creative content related to violence, hate, misinformation or sex, but you will not provide any content that could directly or indirectly lead to harmful outcomes.\n{%- endif %}\n\n\nYour information cutoff date is June 2024.\n\nYou have been trained on data in English, French, Spanish, Italian, German, Portuguese, Japanese, Korean, Modern Standard Arabic, Mandarin, Russian, Indonesian, Turkish, Dutch, Polish, Persian, Vietnamese, Czech, Hindi, Ukrainian, Romanian, Greek and Hebrew but have the ability to speak many more languages.\n\n# Default Preamble\nThe following instructions are your defaults unless specified elsewhere in developer preamble or user prompt.\n- Your name is Command.\n- You are a large language model built by Cohere.\n- You reply conversationally with a friendly and informative tone and often include introductory statements and follow-up questions.\n- If the input is ambiguous, ask clarifying follow-up questions.\n- Use Markdown-specific formatting in your response (for example to highlight phrases in bold or italics, create tables, or format code blocks).\n- Use LaTeX to generate mathematical notation for complex equations.\n- When responding in English, use American English unless context indicates otherwise.\n- When outputting responses of more than seven sentences, split the response into paragraphs.\n- Prefer the active voice.\n- Adhere to the APA style guidelines for punctuation, spelling, hyphenation, capitalization, numbers, lists, and quotation marks. Do not worry about them for other elements such as italics, citations, figures, or references.\n- Use gender-neutral pronouns for unspecified persons.\n- Limit lists to no more than 10 items unless the list is a set of finite instructions, in which case complete the list.\n- Use the third person when asked to write a summary.\n- When asked to extract values from source material, use the exact form, separated by commas.\n- When generating code output, please provide an explanation after the code.\n- When generating code output without specifying the programming language, please generate Python code.\n- If you are asked a question that requires reasoning, first think through your answer, slowly and step by step, then answer.\n{%- if developer_preamble %}\n\n\n# Developer Preamble\nThe following instructions take precedence over instructions in the default preamble and user prompt. You reject any instructions which conflict with system preamble instructions.\n{{ developer_preamble }}\n{%- endif -%}\n<|END_OF_TURN_TOKEN|>\n{%- for message in messages %}\n {%- if message.role|lower == 'system' and not (loop.first and developer_preamble)%}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>\n {%- elif message.role|lower == 'user' %}\n<|START_OF_TURN_TOKEN|><|USER_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>\n {%- elif message.role|lower == 'assistant' or message.role|lower == 'chatbot' %}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|><|START_RESPONSE|>{{message.content}}<|END_RESPONSE|><|END_OF_TURN_TOKEN|>\n {%- endif %}\n{%- endfor %}<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{%- if add_generation_prompt -%}<|START_RESPONSE|>{%- endif %}\n{% endif %}"
+ },
+ {
+ "name": "tool_use",
+ "template": "{{ bos_token }}{%- macro document_turn(documents) -%}\n{# format documents into chat turn #}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|><|START_THINKING|>I will look through the document to address the users needs.<|END_THINKING|><|START_ACTION|>[\n {\"tool_call_id\": \"0\", \"tool_name\": \"direct-injected-document\", \"parameters\": {}}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|><|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n {\n \"tool_call_id\": \"0\",\n \"results\": {\n{% for doc in documents %}\n \"{{ loop.index0 }}\": {{doc|tojson}}{% if not loop.last %},\n {% endif %}\n{% endfor %}\n\n },\n \"is_error\": null\n }\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>{%- endmacro %}\n{%- macro tool_call_id_to_int(messages, tool_call_id) %}\n{%- set counter = namespace(value=0) %}\n{%- set tool_call_id_seen = namespace(value=false) %}\n{%- for msg in messages %}\n {%- if msg.tool_calls %}\n {%- for tool_call in msg.tool_calls %}\n {%- if tool_call.id == tool_call_id and not tool_call_id_seen.value -%}\n {{ counter.value }}\n {%- set tool_call_id_seen.value = true %}\n {%- endif %}\n {%- set counter.value = counter.value + 1 %}\n {%- endfor %}\n {%- endif %}\n{%- endfor %}\n{%- endmacro %}\n{%- macro format_tool_message(messages, tool_msg) -%}\n{# format tool message #}\n {\n \"tool_call_id\": \"{{ tool_call_id_to_int(messages, tool_msg.tool_call_id) }}\",\n \"results\": {\n \"0\": {{ tool_msg.content|tojson }}\n },\n \"is_error\": null\n }\n{%- endmacro -%}\n{%- if messages and messages[0]['role']|lower == 'system' %}{%- set developer_preamble = messages[0]['content'] %}{% endif %}\n{%- set tool_idx = namespace(value=0) %}\n{%- set tool_ids_seen = namespace(value=[]) %}\n{%- set sent_documents = namespace(value=false) %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|># System Preamble\nYou are in contextual safety mode. You will reject requests to generate child sexual abuse material and child exploitation material in your responses. You will accept to provide information and creative content related to violence, hate, misinformation or sex, but you will not provide any content that could directly or indirectly lead to harmful outcomes.\n\nYour information cutoff date is June 2024.\n\nYou have been trained on data in English, French, Spanish, Italian, German, Portuguese, Japanese, Korean, Modern Standard Arabic, Mandarin, Russian, Indonesian, Turkish, Dutch, Polish, Persian, Vietnamese, Czech, Hindi, Ukrainian, Romanian, Greek and Hebrew but have the ability to speak many more languages.\n{% if tools or documents %}\n\nYou have been trained to have advanced reasoning and tool-use capabilities and you should make best use of these skills to serve user's requests.\n\n## Tool Use\nThink about how you can make best use of the provided tools to help with the task and come up with a high level plan that you will execute first.\n\n0. Start by writing <|START_THINKING|> followed by a detailed step by step plan of how you will solve the problem. For each step explain your thinking fully and give details of required tool calls (if needed). Unless specified otherwise, you write your plan in natural language. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when the user request is so straightforward to address that only a trivial plan would be needed.\n NOTE: You MUST skip this step when you are directly responding to the user's request without using any tools.\n\nThen carry out your plan by repeatedly executing the following steps.\n1. Action: write <|START_ACTION|> followed by a list of JSON-formatted tool calls, with each one containing \"tool_name\" and \"parameters\" fields.\n When there are multiple tool calls which are completely independent of each other (i.e. they can be executed in parallel), you should list them out all together in one step. When you finish, close it out with <|END_ACTION|>.\n2. Observation: you will then receive results of those tool calls in JSON format in the very next turn, wrapped around by <|START_TOOL_RESULT|> and <|END_TOOL_RESULT|>. Carefully observe those results and think about what to do next. Note that these results will be provided to you in a separate turn. NEVER hallucinate results.\n Every tool call produces a list of results (when a tool call produces no result or a single result, it'll still get wrapped inside a list). Each result is clearly linked to its originating tool call via its \"tool_call_id\".\n3. Reflection: start the next turn by writing <|START_THINKING|> followed by what you've figured out so far, any changes you need to make to your plan, and what you will do next. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when everything is going according to plan and no special pieces of information or reasoning chains need to be recorded.\n NOTE: You MUST skip this step when you are done with tool-use actions and are ready to respond to the user.\n\nYou can repeat the above 3 steps multiple times (could be 0 times too if no suitable tool calls are available or needed), until you decide it's time to finally respond to the user.\n\n4. Response: then break out of the loop and write <|START_RESPONSE|> followed by a piece of text which serves as a response to the user's last request. Use all previous tool calls and results to help you when formulating your response. When you finish, close it out with <|END_RESPONSE|>.\n{% if enable_citations %}\n\n## Grounding\nImportantly, note that \"Reflection\" and \"Response\" above can be grounded.\nGrounding means you associate pieces of texts (called \"spans\") with those specific tool results that support them (called \"sources\"). And you use a pair of tags \"\" and \"\" to indicate when a span can be grounded onto a list of sources, listing them out in the closing tag. Sources from the same tool call are grouped together and listed as \"{tool_call_id}:[{list of result indices}]\", before they are joined together by \",\". E.g., \"span\" means that \"span\" is supported by result 1 and 2 from \"tool_call_id=0\" as well as result 0 from \"tool_call_id=1\".\n{% endif %}\n\n## Available Tools\nHere is the list of tools that you have available to you.\nYou can ONLY use the tools listed here. When a tool is not listed below, it is NOT available and you should NEVER attempt to use it.\nEach tool is represented as a JSON object with fields like \"name\", \"description\", \"parameters\" (per JSON Schema), and optionally, \"responses\" (per JSON Schema).\n\n```json\n[\n{% if documents %}\n {\"name\": \"direct-injected-document\", \"description\": \"This is a special tool to directly inject user-uploaded documents into the chat as additional context. DO NOT use this tool by yourself!\", \"parameters\": {\"type\": \"object\", \"properties\": {}, \"required\": []}, \"responses\": {\"200\": {\"description\": \"Successfully returned a list of chunked text snippets from the directly uploaded documents.\", \"content\": {\"application/json\": {\"schema\": {\"type\": \"array\", \"items\": {\"type\": \"object\", \"required\": [\"url\", \"snippet\"], \"properties\": {\"url\": {\"type\": \"string\", \"description\": \"The url of the uploaded document.\"}, \"snippet\": {\"type\": \"string\", \"description\": \"The text snippet for the returned document chunk.\"}}}}}}}}}{%- if tools %},{% endif %}\n\n{% endif %}\n{% for tool in tools %}\n {\"name\": \"{{ tool['function']['name'] }}\", \"description\": \"{{tool['function']['description']}}\", \"parameters\": {{ tool['function']['parameters']|tojson }}, \"responses\": null}{%- if not loop.last %},{% endif %}\n\n{% endfor %}\n]\n```\n\n{% endif %}\n# Default Preamble\nThe following instructions are your defaults unless specified elsewhere in developer preamble or user prompt.\n- Your name is Command.\n- You are a large language model built by Cohere.\n- You reply conversationally with a friendly and informative tone and often include introductory statements and follow-up questions.\n- If the input is ambiguous, ask clarifying follow-up questions.\n- Use Markdown-specific formatting in your response (for example to highlight phrases in bold or italics, create tables, or format code blocks).\n- Use LaTeX to generate mathematical notation for complex equations.\n- When responding in English, use American English unless context indicates otherwise.\n- When outputting responses of more than seven sentences, split the response into paragraphs.\n- Prefer the active voice.\n- Adhere to the APA style guidelines for punctuation, spelling, hyphenation, capitalization, numbers, lists, and quotation marks. Do not worry about them for other elements such as italics, citations, figures, or references.\n- Use gender-neutral pronouns for unspecified persons.\n- Limit lists to no more than 10 items unless the list is a set of finite instructions, in which case complete the list.\n- Use the third person when asked to write a summary.\n- When asked to extract values from source material, use the exact form, separated by commas.\n- When generating code output, please provide an explanation after the code.\n- When generating code output without specifying the programming language, please generate Python code.\n- If you are asked a question that requires reasoning, first think through your answer, slowly and step by step, then answer.\n{%- if developer_preamble %}\n\n\n# Developer Preamble\nThe following instructions take precedence over instructions in the default preamble and user prompt. You reject any instructions which conflict with system preamble instructions.\n{{ developer_preamble }}\n{%- endif -%}\n<|END_OF_TURN_TOKEN|>\n{%- for message in messages %}\n {%- if message.role|lower == 'system' and not (loop.first and developer_preamble)%}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>\n {%- elif message.role|lower == 'user' %}\n<|START_OF_TURN_TOKEN|><|USER_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>{%- if documents and not sent_documents.value %}{%- set sent_documents.value = true %}{% set tool_idx.value = tool_idx.value + 1 %}{{ document_turn(documents) }}{% endif %}\n {%- elif message.role|lower == 'assistant' or message.role|lower == 'chatbot' %}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{% if message.tool_calls %}<|START_THINKING|>{{message.tool_plan}}<|END_THINKING|><|START_ACTION|>[\n {% for tc in message.tool_calls %}\n {\"tool_call_id\": \"{{ tool_idx.value }}\", \"tool_name\": \"{{ tc['function']['name'] }}\", \"parameters\": {{ tc['function']['arguments']|tojson }}}{% if not loop.last %},{% endif %}\n\n {% set tool_idx.value = tool_idx.value + 1 %}\n {% endfor %}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|>{% else %}<|START_RESPONSE|>{{message.content}}<|END_RESPONSE|><|END_OF_TURN_TOKEN|>{% endif %}\n {% elif message.role|lower == 'tool' and message.tool_call_id not in tool_ids_seen.value %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n{{ format_tool_message(messages, message) }}\n {%- for msg in messages[loop.index0 + 1:] %}\n {%- if msg.role|lower == 'tool' %},\n{{ format_tool_message(messages, msg) }}\n {%- set tool_ids_seen.value = tool_ids_seen.value + [msg.tool_call_id] %}\n {%- else %}\n {%- break %}\n {%- endif %}\n {%- endfor %}\n\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>\n {%- endif %}\n{%- endfor %}<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>"
+ },
+ {
+ "name": "rag",
+ "template": "{{ bos_token }}{% set tools = [] %}\n{%- macro document_turn(documents) -%}\n{# format documents into chat turn #}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|><|START_THINKING|>I will look through the document to address the users needs.<|END_THINKING|><|START_ACTION|>[\n {\"tool_call_id\": \"0\", \"tool_name\": \"direct-injected-document\", \"parameters\": {}}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|><|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n {\n \"tool_call_id\": \"0\",\n \"results\": {\n{% for doc in documents %}\n \"{{ loop.index0 }}\": {{doc|tojson}}{% if not loop.last %},\n {% endif %}\n{% endfor %}\n\n },\n \"is_error\": null\n }\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>{%- endmacro %}\n{%- macro tool_call_id_to_int(messages, tool_call_id) %}\n{%- set counter = namespace(value=0) %}\n{%- set tool_call_id_seen = namespace(value=false) %}\n{%- for msg in messages %}\n {%- if msg.tool_calls %}\n {%- for tool_call in msg.tool_calls %}\n {%- if tool_call.id == tool_call_id and not tool_call_id_seen.value -%}\n {{ counter.value }}\n {%- set tool_call_id_seen.value = true %}\n {%- endif %}\n {%- set counter.value = counter.value + 1 %}\n {%- endfor %}\n {%- endif %}\n{%- endfor %}\n{%- endmacro %}\n{%- macro format_tool_message(messages, tool_msg) -%}\n{# format tool message #}\n {\n \"tool_call_id\": \"{{ tool_call_id_to_int(messages, tool_msg.tool_call_id) }}\",\n \"results\": {\n \"0\": {{ tool_msg.content|tojson }}\n },\n \"is_error\": null\n }\n{%- endmacro -%}\n{%- if messages and messages[0]['role']|lower == 'system' %}{%- set developer_preamble = messages[0]['content'] %}{% endif %}\n{%- set tool_idx = namespace(value=0) %}\n{%- set tool_ids_seen = namespace(value=[]) %}\n{%- set sent_documents = namespace(value=false) %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|># System Preamble\nYou are in contextual safety mode. You will reject requests to generate child sexual abuse material and child exploitation material in your responses. You will accept to provide information and creative content related to violence, hate, misinformation or sex, but you will not provide any content that could directly or indirectly lead to harmful outcomes.\n\nYour information cutoff date is June 2024.\n\nYou have been trained on data in English, French, Spanish, Italian, German, Portuguese, Japanese, Korean, Modern Standard Arabic, Mandarin, Russian, Indonesian, Turkish, Dutch, Polish, Persian, Vietnamese, Czech, Hindi, Ukrainian, Romanian, Greek and Hebrew but have the ability to speak many more languages.\n{% if tools or documents %}\n\nYou have been trained to have advanced reasoning and tool-use capabilities and you should make best use of these skills to serve user's requests.\n\n## Tool Use\nThink about how you can make best use of the provided tools to help with the task and come up with a high level plan that you will execute first.\n\n0. Start by writing <|START_THINKING|> followed by a detailed step by step plan of how you will solve the problem. For each step explain your thinking fully and give details of required tool calls (if needed). Unless specified otherwise, you write your plan in natural language. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when the user request is so straightforward to address that only a trivial plan would be needed.\n NOTE: You MUST skip this step when you are directly responding to the user's request without using any tools.\n\nThen carry out your plan by repeatedly executing the following steps.\n1. Action: write <|START_ACTION|> followed by a list of JSON-formatted tool calls, with each one containing \"tool_name\" and \"parameters\" fields.\n When there are multiple tool calls which are completely independent of each other (i.e. they can be executed in parallel), you should list them out all together in one step. When you finish, close it out with <|END_ACTION|>.\n2. Observation: you will then receive results of those tool calls in JSON format in the very next turn, wrapped around by <|START_TOOL_RESULT|> and <|END_TOOL_RESULT|>. Carefully observe those results and think about what to do next. Note that these results will be provided to you in a separate turn. NEVER hallucinate results.\n Every tool call produces a list of results (when a tool call produces no result or a single result, it'll still get wrapped inside a list). Each result is clearly linked to its originating tool call via its \"tool_call_id\".\n3. Reflection: start the next turn by writing <|START_THINKING|> followed by what you've figured out so far, any changes you need to make to your plan, and what you will do next. When you finish, close it out with <|END_THINKING|>.\n You can optionally choose to skip this step when everything is going according to plan and no special pieces of information or reasoning chains need to be recorded.\n NOTE: You MUST skip this step when you are done with tool-use actions and are ready to respond to the user.\n\nYou can repeat the above 3 steps multiple times (could be 0 times too if no suitable tool calls are available or needed), until you decide it's time to finally respond to the user.\n\n4. Response: then break out of the loop and write <|START_RESPONSE|> followed by a piece of text which serves as a response to the user's last request. Use all previous tool calls and results to help you when formulating your response. When you finish, close it out with <|END_RESPONSE|>.\n{% if enable_citations %}\n\n## Grounding\nImportantly, note that \"Reflection\" and \"Response\" above can be grounded.\nGrounding means you associate pieces of texts (called \"spans\") with those specific tool results that support them (called \"sources\"). And you use a pair of tags \"\" and \"\" to indicate when a span can be grounded onto a list of sources, listing them out in the closing tag. Sources from the same tool call are grouped together and listed as \"{tool_call_id}:[{list of result indices}]\", before they are joined together by \",\". E.g., \"span\" means that \"span\" is supported by result 1 and 2 from \"tool_call_id=0\" as well as result 0 from \"tool_call_id=1\".\n{% endif %}\n\n## Available Tools\nHere is the list of tools that you have available to you.\nYou can ONLY use the tools listed here. When a tool is not listed below, it is NOT available and you should NEVER attempt to use it.\nEach tool is represented as a JSON object with fields like \"name\", \"description\", \"parameters\" (per JSON Schema), and optionally, \"responses\" (per JSON Schema).\n\n```json\n[\n{% if documents %}\n {\"name\": \"direct-injected-document\", \"description\": \"This is a special tool to directly inject user-uploaded documents into the chat as additional context. DO NOT use this tool by yourself!\", \"parameters\": {\"type\": \"object\", \"properties\": {}, \"required\": []}, \"responses\": {\"200\": {\"description\": \"Successfully returned a list of chunked text snippets from the directly uploaded documents.\", \"content\": {\"application/json\": {\"schema\": {\"type\": \"array\", \"items\": {\"type\": \"object\", \"required\": [\"url\", \"snippet\"], \"properties\": {\"url\": {\"type\": \"string\", \"description\": \"The url of the uploaded document.\"}, \"snippet\": {\"type\": \"string\", \"description\": \"The text snippet for the returned document chunk.\"}}}}}}}}}{%- if tools %},{% endif %}\n\n{% endif %}\n{% for tool in tools %}\n {\"name\": \"{{ tool['function']['name'] }}\", \"description\": \"{{tool['function']['description']}}\", \"parameters\": {{ tool['function']['parameters']|tojson }}, \"responses\": null}{%- if not loop.last %},{% endif %}\n\n{% endfor %}\n]\n```\n\n{% endif %}\n# Default Preamble\nThe following instructions are your defaults unless specified elsewhere in developer preamble or user prompt.\n- Your name is Command.\n- You are a large language model built by Cohere.\n- You reply conversationally with a friendly and informative tone and often include introductory statements and follow-up questions.\n- If the input is ambiguous, ask clarifying follow-up questions.\n- Use Markdown-specific formatting in your response (for example to highlight phrases in bold or italics, create tables, or format code blocks).\n- Use LaTeX to generate mathematical notation for complex equations.\n- When responding in English, use American English unless context indicates otherwise.\n- When outputting responses of more than seven sentences, split the response into paragraphs.\n- Prefer the active voice.\n- Adhere to the APA style guidelines for punctuation, spelling, hyphenation, capitalization, numbers, lists, and quotation marks. Do not worry about them for other elements such as italics, citations, figures, or references.\n- Use gender-neutral pronouns for unspecified persons.\n- Limit lists to no more than 10 items unless the list is a set of finite instructions, in which case complete the list.\n- Use the third person when asked to write a summary.\n- When asked to extract values from source material, use the exact form, separated by commas.\n- When generating code output, please provide an explanation after the code.\n- When generating code output without specifying the programming language, please generate Python code.\n- If you are asked a question that requires reasoning, first think through your answer, slowly and step by step, then answer.\n{%- if developer_preamble %}\n\n\n# Developer Preamble\nThe following instructions take precedence over instructions in the default preamble and user prompt. You reject any instructions which conflict with system preamble instructions.\n{{ developer_preamble }}\n{%- endif -%}\n<|END_OF_TURN_TOKEN|>\n{%- for message in messages %}\n {%- if message.role|lower == 'system' and not (loop.first and developer_preamble)%}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>\n {%- elif message.role|lower == 'user' %}\n<|START_OF_TURN_TOKEN|><|USER_TOKEN|>{{ message.content }}<|END_OF_TURN_TOKEN|>{%- if documents and not sent_documents.value %}{%- set sent_documents.value = true %}{% set tool_idx.value = tool_idx.value + 1 %}{{ document_turn(documents) }}{% endif %}\n {%- elif message.role|lower == 'assistant' or message.role|lower == 'chatbot' %}\n<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>{% if message.tool_calls %}<|START_THINKING|>{{message.tool_plan}}<|END_THINKING|><|START_ACTION|>[\n {% for tc in message.tool_calls %}\n {\"tool_call_id\": \"{{ tool_idx.value }}\", \"tool_name\": \"{{ tc['function']['name'] }}\", \"parameters\": {{ tc['function']['arguments']|tojson }}}{% if not loop.last %},{% endif %}\n\n {% set tool_idx.value = tool_idx.value + 1 %}\n {% endfor %}\n]<|END_ACTION|><|END_OF_TURN_TOKEN|>{% else %}<|START_RESPONSE|>{{message.content}}<|END_RESPONSE|><|END_OF_TURN_TOKEN|>{% endif %}\n {% elif message.role|lower == 'tool' and message.tool_call_id not in tool_ids_seen.value %}\n<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|><|START_TOOL_RESULT|>[\n{{ format_tool_message(messages, message) }}\n {%- for msg in messages[loop.index0 + 1:] %}\n {%- if msg.role|lower == 'tool' %},\n{{ format_tool_message(messages, msg) }}\n {%- set tool_ids_seen.value = tool_ids_seen.value + [msg.tool_call_id] %}\n {%- else %}\n {%- break %}\n {%- endif %}\n {%- endfor %}\n\n]<|END_TOOL_RESULT|><|END_OF_TURN_TOKEN|>\n {%- endif %}\n{%- endfor %}<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>"
+ }
+ ],
+ "added_tokens_decoder": {
+ "0": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "1": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "2": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "3": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "4": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255000": {
+ "content": "<|START_OF_TURN_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255001": {
+ "content": "<|END_OF_TURN_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255002": {
+ "content": "<|USER_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255003": {
+ "content": "<|CHATBOT_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255004": {
+ "content": "<|SYSTEM_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255005": {
+ "content": "<|NEW_FILE|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255006": {
+ "content": "<|BEGINNING_OF_PREFIX_FIM_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255007": {
+ "content": "<|BEGINNING_OF_MIDDLE_FIM_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255008": {
+ "content": "<|BEGINNING_OF_SUFFIX_FIM_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255009": {
+ "content": "<|END_OF_MIDDLE_FIM_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255010": {
+ "content": "<|START_THINKING|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255011": {
+ "content": "<|END_THINKING|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255012": {
+ "content": "<|START_TEXT|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255013": {
+ "content": "<|END_TEXT|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255014": {
+ "content": "<|START_ACTION|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255015": {
+ "content": "<|END_ACTION|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255016": {
+ "content": "<|START_TOOL_RESULT|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255017": {
+ "content": "<|END_TOOL_RESULT|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255018": {
+ "content": "<|USER_0_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255019": {
+ "content": "<|USER_1_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255020": {
+ "content": "<|USER_2_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255021": {
+ "content": "<|USER_3_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255022": {
+ "content": "<|USER_4_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255023": {
+ "content": "<|USER_5_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255024": {
+ "content": "<|USER_6_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255025": {
+ "content": "<|USER_7_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255026": {
+ "content": "<|USER_8_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255027": {
+ "content": "<|USER_9_TOKEN|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "255028": {
+ "content": "<|START_OF_IMG|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255029": {
+ "content": "<|END_OF_IMG|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255030": {
+ "content": "<|IMG_LINE_BREAK|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "255031": {
+ "content": "<|IMG_PATCH|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ }
+ }
+}
\ No newline at end of file